vdev_file.c revision 297078
1/* 2 * CDDL HEADER START 3 * 4 * The contents of this file are subject to the terms of the 5 * Common Development and Distribution License (the "License"). 6 * You may not use this file except in compliance with the License. 7 * 8 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE 9 * or http://www.opensolaris.org/os/licensing. 10 * See the License for the specific language governing permissions 11 * and limitations under the License. 12 * 13 * When distributing Covered Code, include this CDDL HEADER in each 14 * file and include the License file at usr/src/OPENSOLARIS.LICENSE. 15 * If applicable, add the following below this CDDL HEADER, with the 16 * fields enclosed by brackets "[]" replaced with your own identifying 17 * information: Portions Copyright [yyyy] [name of copyright owner] 18 * 19 * CDDL HEADER END 20 */ 21/* 22 * Copyright (c) 2005, 2010, Oracle and/or its affiliates. All rights reserved. 23 * Copyright (c) 2011, 2014 by Delphix. All rights reserved. 24 */ 25 26#include <sys/zfs_context.h> 27#include <sys/spa.h> 28#include <sys/vdev_file.h> 29#include <sys/vdev_impl.h> 30#include <sys/zio.h> 31#include <sys/fs/zfs.h> 32#include <sys/fm/fs/zfs.h> 33 34/* 35 * Virtual device vector for files. 36 */ 37 38static void 39vdev_file_hold(vdev_t *vd) 40{ 41 ASSERT(vd->vdev_path != NULL); 42} 43 44static void 45vdev_file_rele(vdev_t *vd) 46{ 47 ASSERT(vd->vdev_path != NULL); 48} 49 50static int 51vdev_file_open(vdev_t *vd, uint64_t *psize, uint64_t *max_psize, 52 uint64_t *logical_ashift, uint64_t *physical_ashift) 53{ 54 vdev_file_t *vf; 55 vnode_t *vp; 56 vattr_t vattr; 57 int error; 58 59 /* 60 * We must have a pathname, and it must be absolute. 61 */ 62 if (vd->vdev_path == NULL || vd->vdev_path[0] != '/') { 63 vd->vdev_stat.vs_aux = VDEV_AUX_BAD_LABEL; 64 return (SET_ERROR(EINVAL)); 65 } 66 67 /* 68 * Reopen the device if it's not currently open. Otherwise, 69 * just update the physical size of the device. 70 */ 71 if (vd->vdev_tsd != NULL) { 72 ASSERT(vd->vdev_reopening); 73 vf = vd->vdev_tsd; 74 vp = vf->vf_vnode; 75 goto skip_open; 76 } 77 78 vf = vd->vdev_tsd = kmem_zalloc(sizeof (vdev_file_t), KM_SLEEP); 79 80 /* 81 * We always open the files from the root of the global zone, even if 82 * we're in a local zone. If the user has gotten to this point, the 83 * administrator has already decided that the pool should be available 84 * to local zone users, so the underlying devices should be as well. 85 */ 86 ASSERT(vd->vdev_path != NULL && vd->vdev_path[0] == '/'); 87 error = vn_openat(vd->vdev_path + 1, UIO_SYSSPACE, 88 spa_mode(vd->vdev_spa) | FOFFMAX, 0, &vp, 0, 0, rootdir, -1); 89 90 if (error) { 91 vd->vdev_stat.vs_aux = VDEV_AUX_OPEN_FAILED; 92 kmem_free(vd->vdev_tsd, sizeof (vdev_file_t)); 93 vd->vdev_tsd = NULL; 94 return (error); 95 } 96 97 vf->vf_vnode = vp; 98 99#ifdef _KERNEL 100 /* 101 * Make sure it's a regular file. 102 */ 103 if (vp->v_type != VREG) { 104#ifdef __FreeBSD__ 105 (void) VOP_CLOSE(vp, spa_mode(vd->vdev_spa), 1, 0, kcred, NULL); 106#endif 107 vd->vdev_stat.vs_aux = VDEV_AUX_OPEN_FAILED; 108#ifdef __FreeBSD__ 109 kmem_free(vd->vdev_tsd, sizeof (vdev_file_t)); 110 vd->vdev_tsd = NULL; 111#endif 112 return (SET_ERROR(ENODEV)); 113 } 114#endif /* _KERNEL */ 115 116skip_open: 117 /* 118 * Determine the physical size of the file. 119 */ 120 vattr.va_mask = AT_SIZE; 121 vn_lock(vp, LK_SHARED | LK_RETRY); 122 error = VOP_GETATTR(vp, &vattr, kcred); 123 VOP_UNLOCK(vp, 0); 124 if (error) { 125 (void) VOP_CLOSE(vp, spa_mode(vd->vdev_spa), 1, 0, kcred, NULL); 126 vd->vdev_stat.vs_aux = VDEV_AUX_OPEN_FAILED; 127 kmem_free(vd->vdev_tsd, sizeof (vdev_file_t)); 128 vd->vdev_tsd = NULL; 129 return (error); 130 } 131 132 vd->vdev_notrim = B_TRUE; 133 134 *max_psize = *psize = vattr.va_size; 135 *logical_ashift = SPA_MINBLOCKSHIFT; 136 *physical_ashift = SPA_MINBLOCKSHIFT; 137 138 return (0); 139} 140 141static void 142vdev_file_close(vdev_t *vd) 143{ 144 vdev_file_t *vf = vd->vdev_tsd; 145 146 if (vd->vdev_reopening || vf == NULL) 147 return; 148 149 if (vf->vf_vnode != NULL) { 150 (void) VOP_CLOSE(vf->vf_vnode, spa_mode(vd->vdev_spa), 1, 0, 151 kcred, NULL); 152 } 153 154 vd->vdev_delayed_close = B_FALSE; 155 kmem_free(vf, sizeof (vdev_file_t)); 156 vd->vdev_tsd = NULL; 157} 158 159static void 160vdev_file_io_start(zio_t *zio) 161{ 162 vdev_t *vd = zio->io_vd; 163 vdev_file_t *vf; 164 vnode_t *vp; 165 ssize_t resid; 166 167 if (!vdev_readable(vd)) { 168 zio->io_error = SET_ERROR(ENXIO); 169 zio_interrupt(zio); 170 return; 171 } 172 173 vf = vd->vdev_tsd; 174 vp = vf->vf_vnode; 175 176 if (zio->io_type == ZIO_TYPE_IOCTL) { 177 switch (zio->io_cmd) { 178 case DKIOCFLUSHWRITECACHE: 179 zio->io_error = VOP_FSYNC(vp, FSYNC | FDSYNC, 180 kcred, NULL); 181 break; 182 default: 183 zio->io_error = SET_ERROR(ENOTSUP); 184 } 185 186 zio_execute(zio); 187 return; 188 } 189 190 ASSERT(zio->io_type == ZIO_TYPE_READ || zio->io_type == ZIO_TYPE_WRITE); 191 192 zio->io_error = vn_rdwr(zio->io_type == ZIO_TYPE_READ ? 193 UIO_READ : UIO_WRITE, vp, zio->io_data, zio->io_size, 194 zio->io_offset, UIO_SYSSPACE, 0, RLIM64_INFINITY, kcred, &resid); 195 196 if (resid != 0 && zio->io_error == 0) 197 zio->io_error = ENOSPC; 198 199 zio_interrupt(zio); 200 201#ifdef illumos 202 VERIFY3U(taskq_dispatch(system_taskq, vdev_file_io_strategy, bp, 203 TQ_SLEEP), !=, 0); 204#endif 205} 206 207/* ARGSUSED */ 208static void 209vdev_file_io_done(zio_t *zio) 210{ 211} 212 213vdev_ops_t vdev_file_ops = { 214 vdev_file_open, 215 vdev_file_close, 216 vdev_default_asize, 217 vdev_file_io_start, 218 vdev_file_io_done, 219 NULL, 220 vdev_file_hold, 221 vdev_file_rele, 222 VDEV_TYPE_FILE, /* name of this vdev type */ 223 B_TRUE /* leaf vdev */ 224}; 225 226/* 227 * From userland we access disks just like files. 228 */ 229#ifndef _KERNEL 230 231vdev_ops_t vdev_disk_ops = { 232 vdev_file_open, 233 vdev_file_close, 234 vdev_default_asize, 235 vdev_file_io_start, 236 vdev_file_io_done, 237 NULL, 238 vdev_file_hold, 239 vdev_file_rele, 240 VDEV_TYPE_DISK, /* name of this vdev type */ 241 B_TRUE /* leaf vdev */ 242}; 243 244#endif 245