Illumos #3581 spa_zio_taskq[ZIO_TYPE_FREE][ZIO_TASKQ_ISSUE]->tq_lock contention
[zfs.git] / module / zfs / vdev_file.c
index dc0e920..06999a8 100644 (file)
  * CDDL HEADER END
  */
 /*
- * Copyright 2008 Sun Microsystems, Inc.  All rights reserved.
- * Use is subject to license terms.
+ * Copyright (c) 2005, 2010, Oracle and/or its affiliates. All rights reserved.
+ * Copyright (c) 2012 by Delphix. All rights reserved.
  */
 
 #include <sys/zfs_context.h>
 #include <sys/spa.h>
+#include <sys/spa_impl.h>
 #include <sys/vdev_file.h>
 #include <sys/vdev_impl.h>
 #include <sys/zio.h>
  * Virtual device vector for files.
  */
 
+static void
+vdev_file_hold(vdev_t *vd)
+{
+       ASSERT(vd->vdev_path != NULL);
+}
+
+static void
+vdev_file_rele(vdev_t *vd)
+{
+       ASSERT(vd->vdev_path != NULL);
+}
+
 static int
-vdev_file_open(vdev_t *vd, uint64_t *psize, uint64_t *ashift)
+vdev_file_open(vdev_t *vd, uint64_t *psize, uint64_t *max_psize,
+    uint64_t *ashift)
 {
        vdev_file_t *vf;
        vnode_t *vp;
@@ -51,7 +65,17 @@ vdev_file_open(vdev_t *vd, uint64_t *psize, uint64_t *ashift)
                return (EINVAL);
        }
 
-       vf = vd->vdev_tsd = kmem_zalloc(sizeof (vdev_file_t), KM_SLEEP);
+       /*
+        * Reopen the device if it's not currently open.  Otherwise,
+        * just update the physical size of the device.
+        */
+       if (vd->vdev_tsd != NULL) {
+               ASSERT(vd->vdev_reopening);
+               vf = vd->vdev_tsd;
+               goto skip_open;
+       }
+
+       vf = vd->vdev_tsd = kmem_zalloc(sizeof (vdev_file_t), KM_PUSHPAGE);
 
        /*
         * We always open the files from the root of the global zone, even if
@@ -61,7 +85,7 @@ vdev_file_open(vdev_t *vd, uint64_t *psize, uint64_t *ashift)
         */
        ASSERT(vd->vdev_path != NULL && vd->vdev_path[0] == '/');
        error = vn_openat(vd->vdev_path + 1, UIO_SYSSPACE,
-           spa_mode | FOFFMAX, 0, &vp, 0, 0, rootdir, -1);
+           spa_mode(vd->vdev_spa) | FOFFMAX, 0, &vp, 0, 0, rootdir, -1);
 
        if (error) {
                vd->vdev_stat.vs_aux = VDEV_AUX_OPEN_FAILED;
@@ -79,6 +103,8 @@ vdev_file_open(vdev_t *vd, uint64_t *psize, uint64_t *ashift)
                return (ENODEV);
        }
 #endif
+
+skip_open:
        /*
         * Determine the physical size of the file.
         */
@@ -89,7 +115,7 @@ vdev_file_open(vdev_t *vd, uint64_t *psize, uint64_t *ashift)
                return (error);
        }
 
-       *psize = vattr.va_size;
+       *max_psize = *psize = vattr.va_size;
        *ashift = SPA_MINBLOCKSHIFT;
 
        return (0);
@@ -100,25 +126,45 @@ vdev_file_close(vdev_t *vd)
 {
        vdev_file_t *vf = vd->vdev_tsd;
 
-       if (vf == NULL)
+       if (vd->vdev_reopening || vf == NULL)
                return;
 
        if (vf->vf_vnode != NULL) {
                (void) VOP_PUTPAGE(vf->vf_vnode, 0, 0, B_INVAL, kcred, NULL);
-               (void) VOP_CLOSE(vf->vf_vnode, spa_mode, 1, 0, kcred, NULL);
-               VN_RELE(vf->vf_vnode);
+               (void) VOP_CLOSE(vf->vf_vnode, spa_mode(vd->vdev_spa), 1, 0,
+                   kcred, NULL);
        }
 
+       vd->vdev_delayed_close = B_FALSE;
        kmem_free(vf, sizeof (vdev_file_t));
        vd->vdev_tsd = NULL;
 }
 
+static void
+vdev_file_io_strategy(void *arg)
+{
+       zio_t *zio = (zio_t *)arg;
+       vdev_t *vd = zio->io_vd;
+       vdev_file_t *vf = vd->vdev_tsd;
+       ssize_t resid;
+
+       zio->io_error = vn_rdwr(zio->io_type == ZIO_TYPE_READ ?
+           UIO_READ : UIO_WRITE, vf->vf_vnode, zio->io_data,
+           zio->io_size, zio->io_offset, UIO_SYSSPACE,
+           0, RLIM64_INFINITY, kcred, &resid);
+
+       if (resid != 0 && zio->io_error == 0)
+               zio->io_error = ENOSPC;
+
+       zio_interrupt(zio);
+}
+
 static int
 vdev_file_io_start(zio_t *zio)
 {
+       spa_t *spa = zio->io_spa;
        vdev_t *vd = zio->io_vd;
        vdev_file_t *vf = vd->vdev_tsd;
-       ssize_t resid;
 
        if (zio->io_type == ZIO_TYPE_IOCTL) {
                /* XXPOLICY */
@@ -139,15 +185,8 @@ vdev_file_io_start(zio_t *zio)
                return (ZIO_PIPELINE_CONTINUE);
        }
 
-       zio->io_error = vn_rdwr(zio->io_type == ZIO_TYPE_READ ?
-           UIO_READ : UIO_WRITE, vf->vf_vnode, zio->io_data,
-           zio->io_size, zio->io_offset, UIO_SYSSPACE,
-           0, RLIM64_INFINITY, kcred, &resid);
-
-       if (resid != 0 && zio->io_error == 0)
-               zio->io_error = ENOSPC;
-
-       zio_interrupt(zio);
+       spa_taskq_dispatch_ent(spa, ZIO_TYPE_FREE, ZIO_TASKQ_ISSUE,
+           vdev_file_io_strategy, zio, 0, &zio->io_tqent);
 
        return (ZIO_PIPELINE_STOP);
 }
@@ -165,6 +204,8 @@ vdev_ops_t vdev_file_ops = {
        vdev_file_io_start,
        vdev_file_io_done,
        NULL,
+       vdev_file_hold,
+       vdev_file_rele,
        VDEV_TYPE_FILE,         /* name of this vdev type */
        B_TRUE                  /* leaf vdev */
 };
@@ -181,6 +222,8 @@ vdev_ops_t vdev_disk_ops = {
        vdev_file_io_start,
        vdev_file_io_done,
        NULL,
+       vdev_file_hold,
+       vdev_file_rele,
        VDEV_TYPE_DISK,         /* name of this vdev type */
        B_TRUE                  /* leaf vdev */
 };