Skip to content

Commit

Permalink
Illumos openzfs#5244 zio pipeline callers should explicitly invoke ne…
Browse files Browse the repository at this point in the history
…xt stage openzfs#2828

References:
https://www.illumos.org/projects/illumos-gate//issues/5244
https://reviews.csiden.org/r/119/diff/#

Porting Notes:
1. The unported "2932 support crash dumps to raidz, etc. pools" caused a
merge conflict due to a copyright difference in module/zfs/vdev_raidz.c.
2. The unported "4128 disks in zpools never go away when pulled" and
additional Linux-specific changes caused merge conflicts in
module/zfs/vdev_disk.c.
3. Our changes to use the TQ_PUSHPAGE extension and vdev_file_taskq
caused merge conflicts in module/zfs/vdev_file.c. The taskq import that
I plan to send in the future would have prevented this particular
conflict.

Reviewed by: Matthew Ahrens [email protected]
Reviewed by: Adam Leventhal [email protected]
Reviewed by: Alex Reece [email protected]
Reviewed by: Christopher Siden [email protected]
Ported-by: Richard Yao [email protected]
  • Loading branch information
ryao authored and kernelOfTruth committed Dec 13, 2014
1 parent a691832 commit db0ccb3
Show file tree
Hide file tree
Showing 9 changed files with 55 additions and 33 deletions.
2 changes: 1 addition & 1 deletion include/sys/vdev_impl.h
Original file line number Diff line number Diff line change
Expand Up @@ -61,7 +61,7 @@ typedef int vdev_open_func_t(vdev_t *vd, uint64_t *size, uint64_t *max_size,
uint64_t *ashift);
typedef void vdev_close_func_t(vdev_t *vd);
typedef uint64_t vdev_asize_func_t(vdev_t *vd, uint64_t psize);
typedef int vdev_io_start_func_t(zio_t *zio);
typedef void vdev_io_start_func_t(zio_t *zio);
typedef void vdev_io_done_func_t(zio_t *zio);
typedef void vdev_state_change_func_t(vdev_t *vd, int, int);
typedef void vdev_hold_func_t(vdev_t *vd);
Expand Down
3 changes: 0 additions & 3 deletions include/sys/zio.h
Original file line number Diff line number Diff line change
Expand Up @@ -154,9 +154,6 @@ typedef enum zio_priority {
ZIO_PRIORITY_NOW /* non-queued i/os (e.g. free) */
} zio_priority_t;

#define ZIO_PIPELINE_CONTINUE 0x100
#define ZIO_PIPELINE_STOP 0x101

enum zio_flag {
/*
* Flags inherited by gang, ddt, and vdev children,
Expand Down
4 changes: 4 additions & 0 deletions lib/libzpool/taskq.c
Original file line number Diff line number Diff line change
Expand Up @@ -25,6 +25,7 @@
/*
* Copyright 2011 Nexenta Systems, Inc. All rights reserved.
* Copyright 2012 Garrett D'Amore <[email protected]>. All rights reserved.
* Copyright (c) 2014 by Delphix. All rights reserved.
*/

#include <sys/zfs_context.h>
Expand All @@ -33,8 +34,10 @@ int taskq_now;
taskq_t *system_taskq;

#define TASKQ_ACTIVE 0x00010000
#define TASKQ_NAMELEN 31

struct taskq {
char tq_name[TASKQ_NAMELEN + 1];
kmutex_t tq_lock;
krwlock_t tq_threadlock;
kcondvar_t tq_dispatch_cv;
Expand Down Expand Up @@ -280,6 +283,7 @@ taskq_create(const char *name, int nthreads, pri_t pri,
cv_init(&tq->tq_dispatch_cv, NULL, CV_DEFAULT, NULL);
cv_init(&tq->tq_wait_cv, NULL, CV_DEFAULT, NULL);
cv_init(&tq->tq_maxalloc_cv, NULL, CV_DEFAULT, NULL);
(void) strncpy(tq->tq_name, name, TASKQ_NAMELEN + 1);
tq->tq_flags = flags | TASKQ_ACTIVE;
tq->tq_active = nthreads;
tq->tq_nthreads = nthreads;
Expand Down
20 changes: 11 additions & 9 deletions module/zfs/vdev_disk.c
Original file line number Diff line number Diff line change
Expand Up @@ -665,7 +665,7 @@ vdev_disk_io_flush(struct block_device *bdev, zio_t *zio)
return (0);
}

static int
static void
vdev_disk_io_start(zio_t *zio)
{
vdev_t *v = zio->io_vd;
Expand All @@ -677,7 +677,9 @@ vdev_disk_io_start(zio_t *zio)

if (!vdev_readable(v)) {
zio->io_error = SET_ERROR(ENXIO);
return (ZIO_PIPELINE_CONTINUE);
zio_interrupt(zio);
return;

}

switch (zio->io_cmd) {
Expand All @@ -693,7 +695,7 @@ vdev_disk_io_start(zio_t *zio)

error = vdev_disk_io_flush(vd->vd_bdev, zio);
if (error == 0)
return (ZIO_PIPELINE_STOP);
return;

zio->io_error = error;
if (error == ENOTSUP)
Expand All @@ -705,8 +707,8 @@ vdev_disk_io_start(zio_t *zio)
zio->io_error = SET_ERROR(ENOTSUP);
}

return (ZIO_PIPELINE_CONTINUE);

zio_execute(zio);
return;
case ZIO_TYPE_WRITE:
flags = WRITE;
break;
Expand All @@ -717,17 +719,17 @@ vdev_disk_io_start(zio_t *zio)

default:
zio->io_error = SET_ERROR(ENOTSUP);
return (ZIO_PIPELINE_CONTINUE);
zio_interrupt(zio);
return;
}

error = __vdev_disk_physio(vd->vd_bdev, zio, NULL,
zio->io_size, zio->io_offset, flags);
if (error) {
zio->io_error = error;
return (ZIO_PIPELINE_CONTINUE);
zio_interrupt(zio);
return;
}

return (ZIO_PIPELINE_STOP);
}

static void
Expand Down
12 changes: 6 additions & 6 deletions module/zfs/vdev_file.c
Original file line number Diff line number Diff line change
Expand Up @@ -20,7 +20,7 @@
*/
/*
* Copyright (c) 2005, 2010, Oracle and/or its affiliates. All rights reserved.
* Copyright (c) 2013 by Delphix. All rights reserved.
* Copyright (c) 2011, 2014 by Delphix. All rights reserved.
*/

#include <sys/zfs_context.h>
Expand Down Expand Up @@ -172,7 +172,7 @@ vdev_file_io_strategy(void *arg)
zio_interrupt(zio);
}

static int
static void
vdev_file_io_start(zio_t *zio)
{
vdev_t *vd = zio->io_vd;
Expand All @@ -182,7 +182,8 @@ vdev_file_io_start(zio_t *zio)
/* XXPOLICY */
if (!vdev_readable(vd)) {
zio->io_error = SET_ERROR(ENXIO);
return (ZIO_PIPELINE_CONTINUE);
zio_interrupt(zio);
return;
}

switch (zio->io_cmd) {
Expand All @@ -198,13 +199,12 @@ vdev_file_io_start(zio_t *zio)
zio->io_error = SET_ERROR(ENOTSUP);
}

return (ZIO_PIPELINE_CONTINUE);
zio_execute(zio);
return;
}

VERIFY3U(taskq_dispatch(vdev_file_taskq, vdev_file_io_strategy, zio,
TQ_PUSHPAGE), !=, 0);

return (ZIO_PIPELINE_STOP);
}

/* ARGSUSED */
Expand Down
9 changes: 5 additions & 4 deletions module/zfs/vdev_mirror.c
Original file line number Diff line number Diff line change
Expand Up @@ -24,7 +24,7 @@
*/

/*
* Copyright (c) 2013 by Delphix. All rights reserved.
* Copyright (c) 2012, 2014 by Delphix. All rights reserved.
*/

#include <sys/zfs_context.h>
Expand Down Expand Up @@ -329,7 +329,7 @@ vdev_mirror_child_select(zio_t *zio)
return (-1);
}

static int
static void
vdev_mirror_io_start(zio_t *zio)
{
mirror_map_t *mm;
Expand Down Expand Up @@ -361,7 +361,8 @@ vdev_mirror_io_start(zio_t *zio)
zio->io_type, zio->io_priority, 0,
vdev_mirror_scrub_done, mc));
}
return (ZIO_PIPELINE_CONTINUE);
zio_execute(zio);
return;
}
/*
* For normal reads just pick one child.
Expand All @@ -387,7 +388,7 @@ vdev_mirror_io_start(zio_t *zio)
c++;
}

return (ZIO_PIPELINE_CONTINUE);
zio_execute(zio);
}

static int
Expand Down
6 changes: 3 additions & 3 deletions module/zfs/vdev_missing.c
Original file line number Diff line number Diff line change
Expand Up @@ -24,7 +24,7 @@
*/

/*
* Copyright (c) 2013 by Delphix. All rights reserved.
* Copyright (c) 2012, 2014 by Delphix. All rights reserved.
*/

/*
Expand Down Expand Up @@ -66,11 +66,11 @@ vdev_missing_close(vdev_t *vd)
}

/* ARGSUSED */
static int
static void
vdev_missing_io_start(zio_t *zio)
{
zio->io_error = SET_ERROR(ENOTSUP);
return (ZIO_PIPELINE_CONTINUE);
zio_execute(zio);
}

/* ARGSUSED */
Expand Down
9 changes: 5 additions & 4 deletions module/zfs/vdev_raidz.c
Original file line number Diff line number Diff line change
Expand Up @@ -21,7 +21,7 @@

/*
* Copyright (c) 2005, 2010, Oracle and/or its affiliates. All rights reserved.
* Copyright (c) 2013 by Delphix. All rights reserved.
* Copyright (c) 2012, 2014 by Delphix. All rights reserved.
*/

#include <sys/zfs_context.h>
Expand Down Expand Up @@ -1716,7 +1716,7 @@ vdev_raidz_child_done(zio_t *zio)
* vdevs have had errors, then create zio read operations to the parity
* columns' VDevs as well.
*/
static int
static void
vdev_raidz_io_start(zio_t *zio)
{
vdev_t *vd = zio->io_vd;
Expand Down Expand Up @@ -1760,7 +1760,8 @@ vdev_raidz_io_start(zio_t *zio)
ZIO_FLAG_NODATA | ZIO_FLAG_OPTIONAL, NULL, NULL));
}

return (ZIO_PIPELINE_CONTINUE);
zio_execute(zio);
return;
}

ASSERT(zio->io_type == ZIO_TYPE_READ);
Expand Down Expand Up @@ -1800,7 +1801,7 @@ vdev_raidz_io_start(zio_t *zio)
}
}

return (ZIO_PIPELINE_CONTINUE);
zio_execute(zio);
}


Expand Down
23 changes: 20 additions & 3 deletions module/zfs/zio.c
Original file line number Diff line number Diff line change
Expand Up @@ -61,6 +61,9 @@ kmem_cache_t *zio_data_buf_cache[SPA_MAXBLOCKSIZE >> SPA_MINBLOCKSHIFT];
int zio_bulk_flags = 0;
int zio_delay_max = ZIO_DELAY_MAX;

#define ZIO_PIPELINE_CONTINUE 0x100
#define ZIO_PIPELINE_STOP 0x101

/*
* The following actions directly effect the spa's sync-to-convergence logic.
* The values below define the sync pass when we start performing the action.
Expand Down Expand Up @@ -2677,6 +2680,18 @@ zio_free_zil(spa_t *spa, uint64_t txg, blkptr_t *bp)
* Read and write to physical devices
* ==========================================================================
*/


/*
* Issue an I/O to the underlying vdev. Typically the issue pipeline
* stops after this stage and will resume upon I/O completion.
* However, there are instances where the vdev layer may need to
* continue the pipeline when an I/O was not issued. Since the I/O
* that was sent to the vdev layer might be different than the one
* currently active in the pipeline (see vdev_queue_io()), we explicitly
* force the underlying vdev layers to call either zio_execute() or
* zio_interrupt() to ensure that the pipeline continues with the correct I/O.
*/
static int
zio_vdev_io_start(zio_t *zio)
{
Expand All @@ -2694,15 +2709,16 @@ zio_vdev_io_start(zio_t *zio)
/*
* The mirror_ops handle multiple DVAs in a single BP.
*/
return (vdev_mirror_ops.vdev_op_io_start(zio));
vdev_mirror_ops.vdev_op_io_start(zio);
return (ZIO_PIPELINE_STOP);
}

/*
* We keep track of time-sensitive I/Os so that the scan thread
* can quickly react to certain workloads. In particular, we care
* about non-scrubbing, top-level reads and writes with the following
* characteristics:
* - synchronous writes of user data to non-slog devices
* - synchronous writes of user data to non-slog devices
* - any reads of user data
* When these conditions are met, adjust the timestamp of spa_last_io
* which allows the scan thread to adjust its workload accordingly.
Expand Down Expand Up @@ -2792,7 +2808,8 @@ zio_vdev_io_start(zio_t *zio)
}
}

return (vd->vdev_ops->vdev_op_io_start(zio));
vd->vdev_ops->vdev_op_io_start(zio);
return (ZIO_PIPELINE_STOP);
}

static int
Expand Down

0 comments on commit db0ccb3

Please sign in to comment.