/* fuse_node.c revision 282960 */
1204076Spjd/* 2204076Spjd * Copyright (c) 2007-2009 Google Inc. and Amit Singh 3204076Spjd * All rights reserved. 4204076Spjd * 5204076Spjd * Redistribution and use in source and binary forms, with or without 6204076Spjd * modification, are permitted provided that the following conditions are 7204076Spjd * met: 8204076Spjd * 9204076Spjd * * Redistributions of source code must retain the above copyright 10204076Spjd * notice, this list of conditions and the following disclaimer. 11204076Spjd * * Redistributions in binary form must reproduce the above 12204076Spjd * copyright notice, this list of conditions and the following disclaimer 13204076Spjd * in the documentation and/or other materials provided with the 14204076Spjd * distribution. 15204076Spjd * * Neither the name of Google Inc. nor the names of its 16204076Spjd * contributors may be used to endorse or promote products derived from 17204076Spjd * this software without specific prior written permission. 18204076Spjd * 19204076Spjd * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS 20204076Spjd * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT 21204076Spjd * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR 22204076Spjd * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT 23204076Spjd * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, 24204076Spjd * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT 25204076Spjd * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 26204076Spjd * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 27204076Spjd * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 28204076Spjd * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE 29204076Spjd * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 30204076Spjd * 31204076Spjd * Copyright (C) 2005 Csaba Henk. 
32204076Spjd * All rights reserved. 33204076Spjd * 34204076Spjd * Redistribution and use in source and binary forms, with or without 35204076Spjd * modification, are permitted provided that the following conditions 36204076Spjd * are met: 37204076Spjd * 1. Redistributions of source code must retain the above copyright 38204076Spjd * notice, this list of conditions and the following disclaimer. 39204076Spjd * 2. Redistributions in binary form must reproduce the above copyright 40204076Spjd * notice, this list of conditions and the following disclaimer in the 41204076Spjd * documentation and/or other materials provided with the distribution. 42204076Spjd * 43204076Spjd * THIS SOFTWARE IS PROVIDED BY AUTHOR AND CONTRIBUTORS ``AS IS'' AND 44204076Spjd * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 45204076Spjd * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 46204076Spjd * ARE DISCLAIMED. IN NO EVENT SHALL AUTHOR OR CONTRIBUTORS BE LIABLE 47204076Spjd * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 48204076Spjd * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 49204076Spjd * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 50204076Spjd * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 51204076Spjd * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 52204076Spjd * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 53204076Spjd * SUCH DAMAGE. 
54204076Spjd */ 55204076Spjd 56204076Spjd#include <sys/cdefs.h> 57204076Spjd__FBSDID("$FreeBSD: stable/10/sys/fs/fuse/fuse_node.c 282960 2015-05-15 11:03:19Z trasz $"); 58204076Spjd 59204076Spjd#include <sys/types.h> 60204076Spjd#include <sys/module.h> 61204076Spjd#include <sys/systm.h> 62204076Spjd#include <sys/errno.h> 63204076Spjd#include <sys/param.h> 64204076Spjd#include <sys/kernel.h> 65204076Spjd#include <sys/conf.h> 66204076Spjd#include <sys/uio.h> 67204076Spjd#include <sys/malloc.h> 68204076Spjd#include <sys/queue.h> 69204076Spjd#include <sys/lock.h> 70204076Spjd#include <sys/sx.h> 71204076Spjd#include <sys/mutex.h> 72204076Spjd#include <sys/proc.h> 73204076Spjd#include <sys/vnode.h> 74204076Spjd#include <sys/namei.h> 75204076Spjd#include <sys/mount.h> 76204076Spjd#include <sys/sysctl.h> 77204076Spjd#include <sys/fcntl.h> 78204076Spjd#include <sys/fnv_hash.h> 79204076Spjd#include <sys/priv.h> 80204076Spjd#include <security/mac/mac_framework.h> 81204076Spjd#include <vm/vm.h> 82204076Spjd#include <vm/vm_extern.h> 83204076Spjd 84204076Spjd#include "fuse.h" 85204076Spjd#include "fuse_node.h" 86204076Spjd#include "fuse_internal.h" 87204076Spjd#include "fuse_io.h" 88204076Spjd#include "fuse_ipc.h" 89204076Spjd 90204076Spjd#define FUSE_DEBUG_MODULE VNOPS 91204076Spjd#include "fuse_debug.h" 92204076Spjd 93204076SpjdMALLOC_DEFINE(M_FUSEVN, "fuse_vnode", "fuse vnode private data"); 94204076Spjd 95204076Spjdstatic int fuse_node_count = 0; 96204076Spjd 97204076SpjdSYSCTL_INT(_vfs_fuse, OID_AUTO, node_count, CTLFLAG_RD, 98204076Spjd &fuse_node_count, 0, ""); 99204076Spjd 100204076Spjdint fuse_data_cache_enable = 1; 101204076Spjd 102204076SpjdSYSCTL_INT(_vfs_fuse, OID_AUTO, data_cache_enable, CTLFLAG_RW, 103204076Spjd &fuse_data_cache_enable, 0, ""); 104204076Spjd 105204076Spjdint fuse_data_cache_invalidate = 0; 106204076Spjd 107204076SpjdSYSCTL_INT(_vfs_fuse, OID_AUTO, data_cache_invalidate, CTLFLAG_RW, 108204076Spjd &fuse_data_cache_invalidate, 0, ""); 109204076Spjd 
110204076Spjdint fuse_mmap_enable = 1; 111204076Spjd 112204076SpjdSYSCTL_INT(_vfs_fuse, OID_AUTO, mmap_enable, CTLFLAG_RW, 113204076Spjd &fuse_mmap_enable, 0, ""); 114204076Spjd 115204076Spjdint fuse_refresh_size = 0; 116204076Spjd 117204076SpjdSYSCTL_INT(_vfs_fuse, OID_AUTO, refresh_size, CTLFLAG_RW, 118204076Spjd &fuse_refresh_size, 0, ""); 119204076Spjd 120204076Spjdint fuse_sync_resize = 1; 121204076Spjd 122204076SpjdSYSCTL_INT(_vfs_fuse, OID_AUTO, sync_resize, CTLFLAG_RW, 123204076Spjd &fuse_sync_resize, 0, ""); 124204076Spjd 125204076Spjdint fuse_fix_broken_io = 0; 126204076Spjd 127204076SpjdSYSCTL_INT(_vfs_fuse, OID_AUTO, fix_broken_io, CTLFLAG_RW, 128204076Spjd &fuse_fix_broken_io, 0, ""); 129204076Spjd 130204076Spjdstatic void 131204076Spjdfuse_vnode_init(struct vnode *vp, struct fuse_vnode_data *fvdat, 132204076Spjd uint64_t nodeid, enum vtype vtyp) 133204076Spjd{ 134204076Spjd int i; 135204076Spjd 136204076Spjd fvdat->nid = nodeid; 137204076Spjd if (nodeid == FUSE_ROOT_ID) { 138204076Spjd vp->v_vflag |= VV_ROOT; 139204076Spjd } 140204076Spjd vp->v_type = vtyp; 141204076Spjd vp->v_data = fvdat; 142204076Spjd 143204076Spjd for (i = 0; i < FUFH_MAXTYPE; i++) 144204076Spjd fvdat->fufh[i].fh_type = FUFH_INVALID; 145204076Spjd 146204076Spjd atomic_add_acq_int(&fuse_node_count, 1); 147204076Spjd} 148204076Spjd 149204076Spjdvoid 150204076Spjdfuse_vnode_destroy(struct vnode *vp) 151204076Spjd{ 152204076Spjd struct fuse_vnode_data *fvdat = vp->v_data; 153204076Spjd 154204076Spjd vp->v_data = NULL; 155204076Spjd free(fvdat, M_FUSEVN); 156204076Spjd 157204076Spjd atomic_subtract_acq_int(&fuse_node_count, 1); 158204076Spjd} 159204076Spjd 160204076Spjdstatic int 161204076Spjdfuse_vnode_cmp(struct vnode *vp, void *nidp) 162204076Spjd{ 163204076Spjd return (VTOI(vp) != *((uint64_t *)nidp)); 164204076Spjd} 165204076Spjd 166204076Spjdstatic uint32_t __inline 167204076Spjdfuse_vnode_hash(uint64_t id) 168204076Spjd{ 169204076Spjd return (fnv_32_buf(&id, sizeof(id), 
FNV1_32_INIT)); 170204076Spjd} 171204076Spjd 172204076Spjdstatic int 173204076Spjdfuse_vnode_alloc(struct mount *mp, 174204076Spjd struct thread *td, 175204076Spjd uint64_t nodeid, 176204076Spjd enum vtype vtyp, 177204076Spjd struct vnode **vpp) 178204076Spjd{ 179204076Spjd struct fuse_vnode_data *fvdat; 180204076Spjd struct vnode *vp2; 181204076Spjd int err = 0; 182204076Spjd 183204076Spjd FS_DEBUG("been asked for vno #%ju\n", (uintmax_t)nodeid); 184204076Spjd 185204076Spjd if (vtyp == VNON) { 186204076Spjd return EINVAL; 187204076Spjd } 188204076Spjd *vpp = NULL; 189204076Spjd err = vfs_hash_get(mp, fuse_vnode_hash(nodeid), LK_EXCLUSIVE, td, vpp, 190204076Spjd fuse_vnode_cmp, &nodeid); 191 if (err) 192 return (err); 193 194 if (*vpp) { 195 MPASS((*vpp)->v_type == vtyp && (*vpp)->v_data != NULL); 196 FS_DEBUG("vnode taken from hash\n"); 197 return (0); 198 } 199 fvdat = malloc(sizeof(*fvdat), M_FUSEVN, M_WAITOK | M_ZERO); 200 err = getnewvnode("fuse", mp, &fuse_vnops, vpp); 201 if (err) { 202 free(fvdat, M_FUSEVN); 203 return (err); 204 } 205 lockmgr((*vpp)->v_vnlock, LK_EXCLUSIVE, NULL); 206 fuse_vnode_init(*vpp, fvdat, nodeid, vtyp); 207 err = insmntque(*vpp, mp); 208 ASSERT_VOP_ELOCKED(*vpp, "fuse_vnode_alloc"); 209 if (err) { 210 free(fvdat, M_FUSEVN); 211 *vpp = NULL; 212 return (err); 213 } 214 err = vfs_hash_insert(*vpp, fuse_vnode_hash(nodeid), LK_EXCLUSIVE, 215 td, &vp2, fuse_vnode_cmp, &nodeid); 216 if (err) 217 return (err); 218 if (vp2 != NULL) { 219 *vpp = vp2; 220 return (0); 221 } 222 223 ASSERT_VOP_ELOCKED(*vpp, "fuse_vnode_alloc"); 224 225 return (0); 226} 227 228int 229fuse_vnode_get(struct mount *mp, 230 uint64_t nodeid, 231 struct vnode *dvp, 232 struct vnode **vpp, 233 struct componentname *cnp, 234 enum vtype vtyp) 235{ 236 struct thread *td = (cnp != NULL ? 
cnp->cn_thread : curthread); 237 int err = 0; 238 239 debug_printf("dvp=%p\n", dvp); 240 241 err = fuse_vnode_alloc(mp, td, nodeid, vtyp, vpp); 242 if (err) { 243 return err; 244 } 245 if (dvp != NULL) { 246 MPASS((cnp->cn_flags & ISDOTDOT) == 0); 247 MPASS(!(cnp->cn_namelen == 1 && cnp->cn_nameptr[0] == '.')); 248 fuse_vnode_setparent(*vpp, dvp); 249 } 250 if (dvp != NULL && cnp != NULL && (cnp->cn_flags & MAKEENTRY) != 0) { 251 ASSERT_VOP_LOCKED(*vpp, "fuse_vnode_get"); 252 ASSERT_VOP_LOCKED(dvp, "fuse_vnode_get"); 253 cache_enter(dvp, *vpp, cnp); 254 } 255 256 /* 257 * In userland, libfuse uses cached lookups for dot and dotdot entries, 258 * thus it does not really bump the nlookup counter for forget. 259 * Follow the same semantic and avoid tu bump it in order to keep 260 * nlookup counters consistent. 261 */ 262 if (cnp == NULL || ((cnp->cn_flags & ISDOTDOT) == 0 && 263 (cnp->cn_namelen != 1 || cnp->cn_nameptr[0] != '.'))) 264 VTOFUD(*vpp)->nlookup++; 265 266 return 0; 267} 268 269void 270fuse_vnode_open(struct vnode *vp, int32_t fuse_open_flags, struct thread *td) 271{ 272 /* 273 * Funcation is called for every vnode open. 274 * Merge fuse_open_flags it may be 0 275 * 276 * XXXIP: Handle FOPEN_KEEP_CACHE 277 */ 278 /* 279 * Ideally speaking, direct io should be enabled on 280 * fd's but do not see of any way of providing that 281 * this implementation. 282 283 * Also cannot think of a reason why would two 284 * different fd's on same vnode would like 285 * have DIRECT_IO turned on and off. But linux 286 * based implementation works on an fd not an 287 * inode and provides such a feature. 
288 * 289 * XXXIP: Handle fd based DIRECT_IO 290 */ 291 if (fuse_open_flags & FOPEN_DIRECT_IO) { 292 VTOFUD(vp)->flag |= FN_DIRECTIO; 293 } else { 294 VTOFUD(vp)->flag &= ~FN_DIRECTIO; 295 } 296 297 if (vnode_vtype(vp) == VREG) { 298 /* XXXIP prevent getattr, by using cached node size */ 299 vnode_create_vobject(vp, 0, td); 300 } 301} 302 303int 304fuse_vnode_savesize(struct vnode *vp, struct ucred *cred) 305{ 306 struct fuse_vnode_data *fvdat = VTOFUD(vp); 307 struct thread *td = curthread; 308 struct fuse_filehandle *fufh = NULL; 309 struct fuse_dispatcher fdi; 310 struct fuse_setattr_in *fsai; 311 int err = 0; 312 313 FS_DEBUG("inode=%ju size=%ju\n", (uintmax_t)VTOI(vp), 314 (uintmax_t)fvdat->filesize); 315 ASSERT_VOP_ELOCKED(vp, "fuse_io_extend"); 316 317 if (fuse_isdeadfs(vp)) { 318 return EBADF; 319 } 320 if (vnode_vtype(vp) == VDIR) { 321 return EISDIR; 322 } 323 if (vfs_isrdonly(vnode_mount(vp))) { 324 return EROFS; 325 } 326 if (cred == NULL) { 327 cred = td->td_ucred; 328 } 329 fdisp_init(&fdi, sizeof(*fsai)); 330 fdisp_make_vp(&fdi, FUSE_SETATTR, vp, td, cred); 331 fsai = fdi.indata; 332 fsai->valid = 0; 333 334 /* Truncate to a new value. 
*/ 335 fsai->size = fvdat->filesize; 336 fsai->valid |= FATTR_SIZE; 337 338 fuse_filehandle_getrw(vp, FUFH_WRONLY, &fufh); 339 if (fufh) { 340 fsai->fh = fufh->fh_id; 341 fsai->valid |= FATTR_FH; 342 } 343 err = fdisp_wait_answ(&fdi); 344 fdisp_destroy(&fdi); 345 if (err == 0) 346 fvdat->flag &= ~FN_SIZECHANGE; 347 348 return err; 349} 350 351void 352fuse_vnode_refreshsize(struct vnode *vp, struct ucred *cred) 353{ 354 355 struct fuse_vnode_data *fvdat = VTOFUD(vp); 356 struct vattr va; 357 358 if ((fvdat->flag & FN_SIZECHANGE) != 0 || 359 (fuse_refresh_size == 0 && fvdat->filesize != 0)) 360 return; 361 362 VOP_GETATTR(vp, &va, cred); 363 FS_DEBUG("refreshed file size: %jd\n", (intmax_t)VTOFUD(vp)->filesize); 364} 365 366int 367fuse_vnode_setsize(struct vnode *vp, struct ucred *cred, off_t newsize) 368{ 369 struct fuse_vnode_data *fvdat = VTOFUD(vp); 370 off_t oldsize; 371 int err = 0; 372 373 FS_DEBUG("inode=%ju oldsize=%ju newsize=%ju\n", 374 (uintmax_t)VTOI(vp), (uintmax_t)fvdat->filesize, 375 (uintmax_t)newsize); 376 ASSERT_VOP_ELOCKED(vp, "fuse_vnode_setsize"); 377 378 oldsize = fvdat->filesize; 379 fvdat->filesize = newsize; 380 fvdat->flag |= FN_SIZECHANGE; 381 382 if (newsize < oldsize) { 383 err = vtruncbuf(vp, cred, newsize, fuse_iosize(vp)); 384 } 385 vnode_pager_setsize(vp, newsize); 386 return err; 387} 388