mirror of
https://git.proxmox.com/git/mirror_zfs.git
synced 2025-01-27 18:34:22 +03:00
Fixes and enhancements of SIMD raidz parity
- Implementation lock replaced with atomic variable - Trailing whitespace is removed from user specified parameter, to enhance experience when using commands that add newline, e.g. `echo` - raidz_test: remove dependency on `getrusage()` and RUSAGE_THREAD, Issue #4813 - silence `cppcheck` in vdev_raidz, partial solution of Issue #1392 - Minor fixes and cleanups - Enable use of original parity methods in [fastest] configuration. New opaque original ops structure, representing native methods, is added to supported raidz methods. Original parity methods are executed if selected implementation has NULL fn pointer. Signed-off-by: Gvozden Neskovic <neskovic@gmail.com> Signed-off-by: Brian Behlendorf <behlendorf1@llnl.gov> Issue #4813 Issue #1392
This commit is contained in:
parent
1d9b3bd8fb
commit
c9187d867f
@ -32,7 +32,6 @@
|
|||||||
#include <stdio.h>
|
#include <stdio.h>
|
||||||
|
|
||||||
#include <sys/time.h>
|
#include <sys/time.h>
|
||||||
#include <sys/resource.h>
|
|
||||||
|
|
||||||
#include "raidz_test.h"
|
#include "raidz_test.h"
|
||||||
|
|
||||||
@ -42,7 +41,6 @@
|
|||||||
#define MIN_CS_SHIFT BENCH_ASHIFT
|
#define MIN_CS_SHIFT BENCH_ASHIFT
|
||||||
#define MAX_CS_SHIFT SPA_MAXBLOCKSHIFT
|
#define MAX_CS_SHIFT SPA_MAXBLOCKSHIFT
|
||||||
|
|
||||||
|
|
||||||
static zio_t zio_bench;
|
static zio_t zio_bench;
|
||||||
static raidz_map_t *rm_bench;
|
static raidz_map_t *rm_bench;
|
||||||
static size_t max_data_size = SPA_MAXBLOCKSIZE;
|
static size_t max_data_size = SPA_MAXBLOCKSIZE;
|
||||||
@ -70,28 +68,18 @@ bench_fini_raidz_maps(void)
|
|||||||
bzero(&zio_bench, sizeof (zio_t));
|
bzero(&zio_bench, sizeof (zio_t));
|
||||||
}
|
}
|
||||||
|
|
||||||
static double
|
|
||||||
get_time_diff(struct rusage *start, struct rusage *stop)
|
|
||||||
{
|
|
||||||
return (((double)stop->ru_utime.tv_sec * (double)MICROSEC +
|
|
||||||
(double)stop->ru_utime.tv_usec) -
|
|
||||||
((double)start->ru_utime.tv_sec * (double)MICROSEC +
|
|
||||||
(double)start->ru_utime.tv_usec)) / (double)MICROSEC;
|
|
||||||
}
|
|
||||||
|
|
||||||
static inline void
|
static inline void
|
||||||
run_gen_bench_impl(const char *impl)
|
run_gen_bench_impl(const char *impl)
|
||||||
{
|
{
|
||||||
int fn, ncols;
|
int fn, ncols;
|
||||||
uint64_t ds, iter_cnt, iter, disksize;
|
uint64_t ds, iter_cnt, iter, disksize;
|
||||||
struct rusage start, stop;
|
hrtime_t start;
|
||||||
double elapsed, d_bw;
|
double elapsed, d_bw;
|
||||||
|
|
||||||
/* Benchmark generate functions */
|
/* Benchmark generate functions */
|
||||||
for (fn = 0; fn < RAIDZ_GEN_NUM; fn++) {
|
for (fn = 0; fn < RAIDZ_GEN_NUM; fn++) {
|
||||||
|
|
||||||
for (ds = MIN_CS_SHIFT; ds <= MAX_CS_SHIFT; ds++) {
|
for (ds = MIN_CS_SHIFT; ds <= MAX_CS_SHIFT; ds++) {
|
||||||
|
|
||||||
/* create suitable raidz_map */
|
/* create suitable raidz_map */
|
||||||
ncols = rto_opts.rto_dcols + fn + 1;
|
ncols = rto_opts.rto_dcols + fn + 1;
|
||||||
zio_bench.io_size = 1ULL << ds;
|
zio_bench.io_size = 1ULL << ds;
|
||||||
@ -102,12 +90,11 @@ run_gen_bench_impl(const char *impl)
|
|||||||
iter_cnt = GEN_BENCH_MEMORY;
|
iter_cnt = GEN_BENCH_MEMORY;
|
||||||
iter_cnt /= zio_bench.io_size;
|
iter_cnt /= zio_bench.io_size;
|
||||||
|
|
||||||
getrusage(RUSAGE_THREAD, &start);
|
start = gethrtime();
|
||||||
for (iter = 0; iter < iter_cnt; iter++)
|
for (iter = 0; iter < iter_cnt; iter++)
|
||||||
vdev_raidz_generate_parity(rm_bench);
|
vdev_raidz_generate_parity(rm_bench);
|
||||||
getrusage(RUSAGE_THREAD, &stop);
|
elapsed = NSEC2SEC((double) (gethrtime() - start));
|
||||||
|
|
||||||
elapsed = get_time_diff(&start, &stop);
|
|
||||||
disksize = (1ULL << ds) / rto_opts.rto_dcols;
|
disksize = (1ULL << ds) / rto_opts.rto_dcols;
|
||||||
d_bw = (double)iter_cnt * (double)disksize;
|
d_bw = (double)iter_cnt * (double)disksize;
|
||||||
d_bw /= (1024.0 * 1024.0 * elapsed);
|
d_bw /= (1024.0 * 1024.0 * elapsed);
|
||||||
@ -147,9 +134,9 @@ run_gen_bench(void)
|
|||||||
static void
|
static void
|
||||||
run_rec_bench_impl(const char *impl)
|
run_rec_bench_impl(const char *impl)
|
||||||
{
|
{
|
||||||
struct rusage start, stop;
|
|
||||||
int fn, ncols, nbad;
|
int fn, ncols, nbad;
|
||||||
uint64_t ds, iter_cnt, iter, disksize;
|
uint64_t ds, iter_cnt, iter, disksize;
|
||||||
|
hrtime_t start;
|
||||||
double elapsed, d_bw;
|
double elapsed, d_bw;
|
||||||
static const int tgt[7][3] = {
|
static const int tgt[7][3] = {
|
||||||
{1, 2, 3}, /* rec_p: bad QR & D[0] */
|
{1, 2, 3}, /* rec_p: bad QR & D[0] */
|
||||||
@ -187,12 +174,11 @@ run_rec_bench_impl(const char *impl)
|
|||||||
nbad = MIN(3, raidz_ncols(rm_bench) -
|
nbad = MIN(3, raidz_ncols(rm_bench) -
|
||||||
raidz_parity(rm_bench));
|
raidz_parity(rm_bench));
|
||||||
|
|
||||||
getrusage(RUSAGE_THREAD, &start);
|
start = gethrtime();
|
||||||
for (iter = 0; iter < iter_cnt; iter++)
|
for (iter = 0; iter < iter_cnt; iter++)
|
||||||
vdev_raidz_reconstruct(rm_bench, tgt[fn], nbad);
|
vdev_raidz_reconstruct(rm_bench, tgt[fn], nbad);
|
||||||
getrusage(RUSAGE_THREAD, &stop);
|
elapsed = NSEC2SEC((double) (gethrtime() - start));
|
||||||
|
|
||||||
elapsed = get_time_diff(&start, &stop);
|
|
||||||
disksize = (1ULL << ds) / rto_opts.rto_dcols;
|
disksize = (1ULL << ds) / rto_opts.rto_dcols;
|
||||||
d_bw = (double)iter_cnt * (double)(disksize);
|
d_bw = (double)iter_cnt * (double)(disksize);
|
||||||
d_bw /= (1024.0 * 1024.0 * elapsed);
|
d_bw /= (1024.0 * 1024.0 * elapsed);
|
||||||
|
@ -51,10 +51,10 @@ int vdev_raidz_reconstruct(struct raidz_map *, const int *, int);
|
|||||||
*/
|
*/
|
||||||
void vdev_raidz_math_init(void);
|
void vdev_raidz_math_init(void);
|
||||||
void vdev_raidz_math_fini(void);
|
void vdev_raidz_math_fini(void);
|
||||||
void vdev_raidz_math_get_ops(struct raidz_map *);
|
struct raidz_impl_ops * vdev_raidz_math_get_ops(void);
|
||||||
void vdev_raidz_math_generate(struct raidz_map *);
|
int vdev_raidz_math_generate(struct raidz_map *);
|
||||||
int vdev_raidz_math_reconstruct(struct raidz_map *, const int *,
|
int vdev_raidz_math_reconstruct(struct raidz_map *,
|
||||||
const int *, const int);
|
const int *, const int *, const int);
|
||||||
int vdev_raidz_impl_set(const char *);
|
int vdev_raidz_impl_set(const char *);
|
||||||
|
|
||||||
#ifdef __cplusplus
|
#ifdef __cplusplus
|
||||||
|
@ -89,13 +89,15 @@ typedef boolean_t (*will_work_f)(void);
|
|||||||
typedef void (*init_impl_f)(void);
|
typedef void (*init_impl_f)(void);
|
||||||
typedef void (*fini_impl_f)(void);
|
typedef void (*fini_impl_f)(void);
|
||||||
|
|
||||||
|
#define RAIDZ_IMPL_NAME_MAX (16)
|
||||||
|
|
||||||
typedef struct raidz_impl_ops {
|
typedef struct raidz_impl_ops {
|
||||||
init_impl_f init;
|
init_impl_f init;
|
||||||
fini_impl_f fini;
|
fini_impl_f fini;
|
||||||
raidz_gen_f gen[RAIDZ_GEN_NUM]; /* Parity generate functions */
|
raidz_gen_f gen[RAIDZ_GEN_NUM]; /* Parity generate functions */
|
||||||
raidz_rec_f rec[RAIDZ_REC_NUM]; /* Data reconstruction functions */
|
raidz_rec_f rec[RAIDZ_REC_NUM]; /* Data reconstruction functions */
|
||||||
will_work_f is_supported; /* Support check function */
|
will_work_f is_supported; /* Support check function */
|
||||||
char *name; /* Name of the implementation */
|
char name[RAIDZ_IMPL_NAME_MAX]; /* Name of the implementation */
|
||||||
} raidz_impl_ops_t;
|
} raidz_impl_ops_t;
|
||||||
|
|
||||||
typedef struct raidz_col {
|
typedef struct raidz_col {
|
||||||
@ -127,6 +129,8 @@ typedef struct raidz_map {
|
|||||||
raidz_col_t rm_col[1]; /* Flexible array of I/O columns */
|
raidz_col_t rm_col[1]; /* Flexible array of I/O columns */
|
||||||
} raidz_map_t;
|
} raidz_map_t;
|
||||||
|
|
||||||
|
#define RAIDZ_ORIGINAL_IMPL (INT_MAX)
|
||||||
|
|
||||||
extern const raidz_impl_ops_t vdev_raidz_scalar_impl;
|
extern const raidz_impl_ops_t vdev_raidz_scalar_impl;
|
||||||
#if defined(__x86_64) && defined(HAVE_SSE2) /* only x86_64 for now */
|
#if defined(__x86_64) && defined(HAVE_SSE2) /* only x86_64 for now */
|
||||||
extern const raidz_impl_ops_t vdev_raidz_sse2_impl;
|
extern const raidz_impl_ops_t vdev_raidz_sse2_impl;
|
||||||
|
@ -1684,7 +1684,7 @@ Default value: \fB4,096\fR.
|
|||||||
\fBzfs_vdev_raidz_impl\fR (string)
|
\fBzfs_vdev_raidz_impl\fR (string)
|
||||||
.ad
|
.ad
|
||||||
.RS 12n
|
.RS 12n
|
||||||
Parameter for selecting raidz implementation to use.
|
Parameter for selecting raidz parity implementation to use.
|
||||||
|
|
||||||
Options marked (always) below may be selected on module load as they are
|
Options marked (always) below may be selected on module load as they are
|
||||||
supported on all systems.
|
supported on all systems.
|
||||||
|
@ -458,8 +458,8 @@ vdev_raidz_map_alloc(zio_t *zio, uint64_t unit_shift, uint64_t dcols,
|
|||||||
zio->io_vsd = rm;
|
zio->io_vsd = rm;
|
||||||
zio->io_vsd_ops = &vdev_raidz_vsd_ops;
|
zio->io_vsd_ops = &vdev_raidz_vsd_ops;
|
||||||
|
|
||||||
/* RAIDZ ops init */
|
/* init RAIDZ parity ops */
|
||||||
vdev_raidz_math_get_ops(rm);
|
rm->rm_ops = vdev_raidz_math_get_ops();
|
||||||
|
|
||||||
return (rm);
|
return (rm);
|
||||||
}
|
}
|
||||||
@ -611,10 +611,9 @@ vdev_raidz_generate_parity_pqr(raidz_map_t *rm)
|
|||||||
void
|
void
|
||||||
vdev_raidz_generate_parity(raidz_map_t *rm)
|
vdev_raidz_generate_parity(raidz_map_t *rm)
|
||||||
{
|
{
|
||||||
if (rm->rm_ops) {
|
/* Generate using the new math implementation */
|
||||||
vdev_raidz_math_generate(rm);
|
if (vdev_raidz_math_generate(rm) != RAIDZ_ORIGINAL_IMPL)
|
||||||
return;
|
return;
|
||||||
}
|
|
||||||
|
|
||||||
switch (rm->rm_firstdatacol) {
|
switch (rm->rm_firstdatacol) {
|
||||||
case 1:
|
case 1:
|
||||||
@ -1284,7 +1283,7 @@ vdev_raidz_reconstruct(raidz_map_t *rm, const int *t, int nt)
|
|||||||
{
|
{
|
||||||
int tgts[VDEV_RAIDZ_MAXPARITY], *dt;
|
int tgts[VDEV_RAIDZ_MAXPARITY], *dt;
|
||||||
int ntgts;
|
int ntgts;
|
||||||
int i, c;
|
int i, c, ret;
|
||||||
int code;
|
int code;
|
||||||
int nbadparity, nbaddata;
|
int nbadparity, nbaddata;
|
||||||
int parity_valid[VDEV_RAIDZ_MAXPARITY];
|
int parity_valid[VDEV_RAIDZ_MAXPARITY];
|
||||||
@ -1322,14 +1321,11 @@ vdev_raidz_reconstruct(raidz_map_t *rm, const int *t, int nt)
|
|||||||
|
|
||||||
dt = &tgts[nbadparity];
|
dt = &tgts[nbadparity];
|
||||||
|
|
||||||
/*
|
|
||||||
* Reconstruct using the new math implementation if
|
/* Reconstruct using the new math implementation */
|
||||||
* rm_ops is set.
|
ret = vdev_raidz_math_reconstruct(rm, parity_valid, dt, nbaddata);
|
||||||
*/
|
if (ret != RAIDZ_ORIGINAL_IMPL)
|
||||||
if (rm->rm_ops) {
|
return (ret);
|
||||||
return (vdev_raidz_math_reconstruct(rm, parity_valid, dt,
|
|
||||||
nbaddata));
|
|
||||||
}
|
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* See if we can use any of our optimized reconstruction routines.
|
* See if we can use any of our optimized reconstruction routines.
|
||||||
|
@ -31,8 +31,22 @@
|
|||||||
#include <sys/vdev_raidz.h>
|
#include <sys/vdev_raidz.h>
|
||||||
#include <sys/vdev_raidz_impl.h>
|
#include <sys/vdev_raidz_impl.h>
|
||||||
|
|
||||||
|
extern boolean_t raidz_will_scalar_work(void);
|
||||||
|
|
||||||
|
/* Opaque implementation with NULL methods to represent original methods */
|
||||||
|
static const raidz_impl_ops_t vdev_raidz_original_impl = {
|
||||||
|
.name = "original",
|
||||||
|
.is_supported = raidz_will_scalar_work,
|
||||||
|
};
|
||||||
|
|
||||||
|
/* RAIDZ parity op that contain the fastest methods */
|
||||||
|
static raidz_impl_ops_t vdev_raidz_fastest_impl = {
|
||||||
|
.name = "fastest"
|
||||||
|
};
|
||||||
|
|
||||||
/* All compiled in implementations */
|
/* All compiled in implementations */
|
||||||
const raidz_impl_ops_t *raidz_all_maths[] = {
|
const raidz_impl_ops_t *raidz_all_maths[] = {
|
||||||
|
&vdev_raidz_original_impl,
|
||||||
&vdev_raidz_scalar_impl,
|
&vdev_raidz_scalar_impl,
|
||||||
#if defined(__x86_64) && defined(HAVE_SSE2) /* only x86_64 for now */
|
#if defined(__x86_64) && defined(HAVE_SSE2) /* only x86_64 for now */
|
||||||
&vdev_raidz_sse2_impl,
|
&vdev_raidz_sse2_impl,
|
||||||
@ -49,30 +63,19 @@ const raidz_impl_ops_t *raidz_all_maths[] = {
|
|||||||
static boolean_t raidz_math_initialized = B_FALSE;
|
static boolean_t raidz_math_initialized = B_FALSE;
|
||||||
|
|
||||||
/* Select raidz implementation */
|
/* Select raidz implementation */
|
||||||
static enum vdev_raidz_impl_sel {
|
#define IMPL_FASTEST (UINT32_MAX)
|
||||||
IMPL_FASTEST = -1,
|
#define IMPL_CYCLE (UINT32_MAX - 1)
|
||||||
IMPL_ORIGINAL = -2,
|
#define IMPL_ORIGINAL (0)
|
||||||
IMPL_CYCLE = -3,
|
#define IMPL_SCALAR (1)
|
||||||
IMPL_SCALAR = 0,
|
|
||||||
} zfs_vdev_raidz_impl = IMPL_SCALAR;
|
|
||||||
|
|
||||||
/* selected implementation and its lock */
|
#define RAIDZ_IMPL_READ(i) (*(volatile uint32_t *) &(i))
|
||||||
static krwlock_t vdev_raidz_impl_lock;
|
|
||||||
static raidz_impl_ops_t *vdev_raidz_used_impl =
|
|
||||||
(raidz_impl_ops_t *) &vdev_raidz_scalar_impl;
|
|
||||||
static boolean_t vdev_raidz_impl_user_set = B_FALSE;
|
|
||||||
|
|
||||||
/* RAIDZ op that contain the fastest routines */
|
static uint32_t zfs_vdev_raidz_impl = IMPL_SCALAR;
|
||||||
static raidz_impl_ops_t vdev_raidz_fastest_impl = {
|
static uint32_t user_sel_impl = IMPL_FASTEST;
|
||||||
.name = "fastest"
|
|
||||||
};
|
|
||||||
|
|
||||||
/* Hold all supported implementations */
|
/* Hold all supported implementations */
|
||||||
size_t raidz_supp_impl_cnt = 1;
|
static size_t raidz_supp_impl_cnt = 0;
|
||||||
raidz_impl_ops_t *raidz_supp_impl[ARRAY_SIZE(raidz_all_maths) + 1] = {
|
static raidz_impl_ops_t *raidz_supp_impl[ARRAY_SIZE(raidz_all_maths)];
|
||||||
(raidz_impl_ops_t *) &vdev_raidz_scalar_impl, /* scalar is supported */
|
|
||||||
NULL
|
|
||||||
};
|
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* kstats values for supported impl & original methods
|
* kstats values for supported impl & original methods
|
||||||
@ -87,33 +90,52 @@ static kstat_t *raidz_math_kstat = NULL;
|
|||||||
* Selects the raidz operation for raidz_map
|
* Selects the raidz operation for raidz_map
|
||||||
* If rm_ops is set to NULL original raidz implementation will be used
|
* If rm_ops is set to NULL original raidz implementation will be used
|
||||||
*/
|
*/
|
||||||
void
|
raidz_impl_ops_t *
|
||||||
vdev_raidz_math_get_ops(raidz_map_t *rm)
|
vdev_raidz_math_get_ops()
|
||||||
{
|
{
|
||||||
rw_enter(&vdev_raidz_impl_lock, RW_READER);
|
raidz_impl_ops_t *ops = NULL;
|
||||||
|
const uint32_t impl = RAIDZ_IMPL_READ(zfs_vdev_raidz_impl);
|
||||||
rm->rm_ops = vdev_raidz_used_impl;
|
|
||||||
|
|
||||||
|
switch (impl) {
|
||||||
|
case IMPL_FASTEST:
|
||||||
|
ASSERT(raidz_math_initialized);
|
||||||
|
ops = &vdev_raidz_fastest_impl;
|
||||||
|
break;
|
||||||
#if !defined(_KERNEL)
|
#if !defined(_KERNEL)
|
||||||
if (zfs_vdev_raidz_impl == IMPL_CYCLE) {
|
case IMPL_CYCLE:
|
||||||
|
{
|
||||||
|
ASSERT(raidz_math_initialized);
|
||||||
|
ASSERT3U(raidz_supp_impl_cnt, >, 0);
|
||||||
|
/* Cycle through all supported implementations */
|
||||||
static size_t cycle_impl_idx = 0;
|
static size_t cycle_impl_idx = 0;
|
||||||
size_t idx;
|
size_t idx = (++cycle_impl_idx) % raidz_supp_impl_cnt;
|
||||||
/*
|
ops = raidz_supp_impl[idx];
|
||||||
* Cycle through all supported new implementations, and
|
|
||||||
* when idx == raidz_supp_impl_cnt, use the original
|
|
||||||
*/
|
|
||||||
idx = (++cycle_impl_idx) % (raidz_supp_impl_cnt + 1);
|
|
||||||
rm->rm_ops = raidz_supp_impl[idx];
|
|
||||||
}
|
}
|
||||||
|
break;
|
||||||
#endif
|
#endif
|
||||||
|
case IMPL_ORIGINAL:
|
||||||
|
ops = (raidz_impl_ops_t *) &vdev_raidz_original_impl;
|
||||||
|
break;
|
||||||
|
case IMPL_SCALAR:
|
||||||
|
ops = (raidz_impl_ops_t *) &vdev_raidz_scalar_impl;
|
||||||
|
break;
|
||||||
|
default:
|
||||||
|
ASSERT(raidz_math_initialized);
|
||||||
|
ASSERT3U(impl, <, raidz_supp_impl_cnt);
|
||||||
|
ASSERT3U(raidz_supp_impl_cnt, >, 0);
|
||||||
|
ops = raidz_supp_impl[impl];
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
|
||||||
rw_exit(&vdev_raidz_impl_lock);
|
ASSERT3P(ops, !=, NULL);
|
||||||
|
|
||||||
|
return (ops);
|
||||||
}
|
}
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* Select parity generation method for raidz_map
|
* Select parity generation method for raidz_map
|
||||||
*/
|
*/
|
||||||
void
|
int
|
||||||
vdev_raidz_math_generate(raidz_map_t *rm)
|
vdev_raidz_math_generate(raidz_map_t *rm)
|
||||||
{
|
{
|
||||||
raidz_gen_f gen_parity = NULL;
|
raidz_gen_f gen_parity = NULL;
|
||||||
@ -135,13 +157,17 @@ vdev_raidz_math_generate(raidz_map_t *rm)
|
|||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
|
|
||||||
ASSERT(gen_parity != NULL);
|
/* if method is NULL execute the original implementation */
|
||||||
|
if (gen_parity == NULL)
|
||||||
|
return (RAIDZ_ORIGINAL_IMPL);
|
||||||
|
|
||||||
gen_parity(rm);
|
gen_parity(rm);
|
||||||
|
|
||||||
|
return (0);
|
||||||
}
|
}
|
||||||
|
|
||||||
static raidz_rec_f
|
static raidz_rec_f
|
||||||
_reconstruct_fun_raidz1(raidz_map_t *rm, const int *parity_valid,
|
reconstruct_fun_p_sel(raidz_map_t *rm, const int *parity_valid,
|
||||||
const int nbaddata)
|
const int nbaddata)
|
||||||
{
|
{
|
||||||
if (nbaddata == 1 && parity_valid[CODE_P]) {
|
if (nbaddata == 1 && parity_valid[CODE_P]) {
|
||||||
@ -151,7 +177,7 @@ _reconstruct_fun_raidz1(raidz_map_t *rm, const int *parity_valid,
|
|||||||
}
|
}
|
||||||
|
|
||||||
static raidz_rec_f
|
static raidz_rec_f
|
||||||
_reconstruct_fun_raidz2(raidz_map_t *rm, const int *parity_valid,
|
reconstruct_fun_pq_sel(raidz_map_t *rm, const int *parity_valid,
|
||||||
const int nbaddata)
|
const int nbaddata)
|
||||||
{
|
{
|
||||||
if (nbaddata == 1) {
|
if (nbaddata == 1) {
|
||||||
@ -168,7 +194,7 @@ _reconstruct_fun_raidz2(raidz_map_t *rm, const int *parity_valid,
|
|||||||
}
|
}
|
||||||
|
|
||||||
static raidz_rec_f
|
static raidz_rec_f
|
||||||
_reconstruct_fun_raidz3(raidz_map_t *rm, const int *parity_valid,
|
reconstruct_fun_pqr_sel(raidz_map_t *rm, const int *parity_valid,
|
||||||
const int nbaddata)
|
const int nbaddata)
|
||||||
{
|
{
|
||||||
if (nbaddata == 1) {
|
if (nbaddata == 1) {
|
||||||
@ -208,17 +234,14 @@ vdev_raidz_math_reconstruct(raidz_map_t *rm, const int *parity_valid,
|
|||||||
raidz_rec_f rec_data = NULL;
|
raidz_rec_f rec_data = NULL;
|
||||||
|
|
||||||
switch (raidz_parity(rm)) {
|
switch (raidz_parity(rm)) {
|
||||||
case 1:
|
case PARITY_P:
|
||||||
rec_data = _reconstruct_fun_raidz1(rm, parity_valid,
|
rec_data = reconstruct_fun_p_sel(rm, parity_valid, nbaddata);
|
||||||
nbaddata);
|
|
||||||
break;
|
break;
|
||||||
case 2:
|
case PARITY_PQ:
|
||||||
rec_data = _reconstruct_fun_raidz2(rm, parity_valid,
|
rec_data = reconstruct_fun_pq_sel(rm, parity_valid, nbaddata);
|
||||||
nbaddata);
|
|
||||||
break;
|
break;
|
||||||
case 3:
|
case PARITY_PQR:
|
||||||
rec_data = _reconstruct_fun_raidz3(rm, parity_valid,
|
rec_data = reconstruct_fun_pqr_sel(rm, parity_valid, nbaddata);
|
||||||
nbaddata);
|
|
||||||
break;
|
break;
|
||||||
default:
|
default:
|
||||||
cmn_err(CE_PANIC, "invalid RAID-Z configuration %d",
|
cmn_err(CE_PANIC, "invalid RAID-Z configuration %d",
|
||||||
@ -226,8 +249,9 @@ vdev_raidz_math_reconstruct(raidz_map_t *rm, const int *parity_valid,
|
|||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
|
|
||||||
ASSERT(rec_data != NULL);
|
if (rec_data == NULL)
|
||||||
|
return (RAIDZ_ORIGINAL_IMPL);
|
||||||
|
else
|
||||||
return (rec_data(rm, dt));
|
return (rec_data(rm, dt));
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -309,13 +333,10 @@ benchmark_raidz_impl(raidz_map_t *bench_rm, const int fn, benchmark_fn bench_fn)
|
|||||||
uint64_t run_cnt, speed, best_speed = 0;
|
uint64_t run_cnt, speed, best_speed = 0;
|
||||||
hrtime_t t_start, t_diff;
|
hrtime_t t_start, t_diff;
|
||||||
raidz_impl_ops_t *curr_impl;
|
raidz_impl_ops_t *curr_impl;
|
||||||
|
raidz_impl_kstat_t * fstat = &raidz_impl_kstats[raidz_supp_impl_cnt];
|
||||||
int impl, i;
|
int impl, i;
|
||||||
|
|
||||||
/*
|
for (impl = 0; impl < raidz_supp_impl_cnt; impl++) {
|
||||||
* Use the sentinel (NULL) from the end of raidz_supp_impl_cnt
|
|
||||||
* to run "original" implementation (bench_rm->rm_ops = NULL)
|
|
||||||
*/
|
|
||||||
for (impl = 0; impl <= raidz_supp_impl_cnt; impl++) {
|
|
||||||
/* set an implementation to benchmark */
|
/* set an implementation to benchmark */
|
||||||
curr_impl = raidz_supp_impl[impl];
|
curr_impl = raidz_supp_impl[impl];
|
||||||
bench_rm->rm_ops = curr_impl;
|
bench_rm->rm_ops = curr_impl;
|
||||||
@ -338,16 +359,19 @@ benchmark_raidz_impl(raidz_map_t *bench_rm, const int fn, benchmark_fn bench_fn)
|
|||||||
else
|
else
|
||||||
raidz_impl_kstats[impl].rec[fn].value.ui64 = speed;
|
raidz_impl_kstats[impl].rec[fn].value.ui64 = speed;
|
||||||
|
|
||||||
/* if curr_impl==NULL the original impl is benchmarked */
|
/* Update fastest implementation method */
|
||||||
if (curr_impl != NULL && speed > best_speed) {
|
if (speed > best_speed) {
|
||||||
best_speed = speed;
|
best_speed = speed;
|
||||||
|
|
||||||
if (bench_fn == benchmark_gen_impl)
|
if (bench_fn == benchmark_gen_impl) {
|
||||||
vdev_raidz_fastest_impl.gen[fn] =
|
vdev_raidz_fastest_impl.gen[fn] =
|
||||||
curr_impl->gen[fn];
|
curr_impl->gen[fn];
|
||||||
else
|
fstat->gen[fn].value.ui64 = speed;
|
||||||
|
} else {
|
||||||
vdev_raidz_fastest_impl.rec[fn] =
|
vdev_raidz_fastest_impl.rec[fn] =
|
||||||
curr_impl->rec[fn];
|
curr_impl->rec[fn];
|
||||||
|
fstat->rec[fn].value.ui64 = speed;
|
||||||
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
@ -361,9 +385,6 @@ vdev_raidz_math_init(void)
|
|||||||
uint64_t bench_parity;
|
uint64_t bench_parity;
|
||||||
int i, c, fn;
|
int i, c, fn;
|
||||||
|
|
||||||
/* init & vdev_raidz_impl_lock */
|
|
||||||
rw_init(&vdev_raidz_impl_lock, NULL, RW_DEFAULT, NULL);
|
|
||||||
|
|
||||||
/* move supported impl into raidz_supp_impl */
|
/* move supported impl into raidz_supp_impl */
|
||||||
for (i = 0, c = 0; i < ARRAY_SIZE(raidz_all_maths); i++) {
|
for (i = 0, c = 0; i < ARRAY_SIZE(raidz_all_maths); i++) {
|
||||||
curr_impl = (raidz_impl_ops_t *) raidz_all_maths[i];
|
curr_impl = (raidz_impl_ops_t *) raidz_all_maths[i];
|
||||||
@ -379,20 +400,16 @@ vdev_raidz_math_init(void)
|
|||||||
raidz_supp_impl[c++] = (raidz_impl_ops_t *) curr_impl;
|
raidz_supp_impl[c++] = (raidz_impl_ops_t *) curr_impl;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
membar_producer(); /* complete raidz_supp_impl[] init */
|
||||||
raidz_supp_impl_cnt = c; /* number of supported impl */
|
raidz_supp_impl_cnt = c; /* number of supported impl */
|
||||||
raidz_supp_impl[c] = NULL; /* sentinel */
|
|
||||||
|
|
||||||
/* init kstat for original routines */
|
init_raidz_kstat(&(raidz_impl_kstats[raidz_supp_impl_cnt]), "fastest");
|
||||||
init_raidz_kstat(&(raidz_impl_kstats[raidz_supp_impl_cnt]), "original");
|
|
||||||
|
|
||||||
#if !defined(_KERNEL)
|
#if !defined(_KERNEL)
|
||||||
/*
|
/* Skip benchmarking and use last implementation as fastest */
|
||||||
* Skip benchmarking and use last implementation as fastest
|
|
||||||
*/
|
|
||||||
memcpy(&vdev_raidz_fastest_impl, raidz_supp_impl[raidz_supp_impl_cnt-1],
|
memcpy(&vdev_raidz_fastest_impl, raidz_supp_impl[raidz_supp_impl_cnt-1],
|
||||||
sizeof (vdev_raidz_fastest_impl));
|
sizeof (vdev_raidz_fastest_impl));
|
||||||
|
strcpy(vdev_raidz_fastest_impl.name, "fastest");
|
||||||
vdev_raidz_fastest_impl.name = "fastest";
|
|
||||||
|
|
||||||
raidz_math_initialized = B_TRUE;
|
raidz_math_initialized = B_TRUE;
|
||||||
|
|
||||||
@ -407,12 +424,13 @@ vdev_raidz_math_init(void)
|
|||||||
bench_zio->io_size = BENCH_ZIO_SIZE; /* only data columns */
|
bench_zio->io_size = BENCH_ZIO_SIZE; /* only data columns */
|
||||||
bench_zio->io_data = zio_data_buf_alloc(BENCH_ZIO_SIZE);
|
bench_zio->io_data = zio_data_buf_alloc(BENCH_ZIO_SIZE);
|
||||||
VERIFY(bench_zio->io_data);
|
VERIFY(bench_zio->io_data);
|
||||||
|
memset(bench_zio->io_data, 0xAA, BENCH_ZIO_SIZE); /* warm up */
|
||||||
|
|
||||||
/* Benchmark parity generation methods */
|
/* Benchmark parity generation methods */
|
||||||
for (fn = 0; fn < RAIDZ_GEN_NUM; fn++) {
|
for (fn = 0; fn < RAIDZ_GEN_NUM; fn++) {
|
||||||
bench_parity = fn + 1;
|
bench_parity = fn + 1;
|
||||||
/* New raidz_map is needed for each generate_p/q/r */
|
/* New raidz_map is needed for each generate_p/q/r */
|
||||||
bench_rm = vdev_raidz_map_alloc(bench_zio, 9,
|
bench_rm = vdev_raidz_map_alloc(bench_zio, SPA_MINBLOCKSHIFT,
|
||||||
BENCH_D_COLS + bench_parity, bench_parity);
|
BENCH_D_COLS + bench_parity, bench_parity);
|
||||||
|
|
||||||
benchmark_raidz_impl(bench_rm, fn, benchmark_gen_impl);
|
benchmark_raidz_impl(bench_rm, fn, benchmark_gen_impl);
|
||||||
@ -421,7 +439,8 @@ vdev_raidz_math_init(void)
|
|||||||
}
|
}
|
||||||
|
|
||||||
/* Benchmark data reconstruction methods */
|
/* Benchmark data reconstruction methods */
|
||||||
bench_rm = vdev_raidz_map_alloc(bench_zio, 9, BENCH_COLS, PARITY_PQR);
|
bench_rm = vdev_raidz_map_alloc(bench_zio, SPA_MINBLOCKSHIFT,
|
||||||
|
BENCH_COLS, PARITY_PQR);
|
||||||
|
|
||||||
for (fn = 0; fn < RAIDZ_REC_NUM; fn++)
|
for (fn = 0; fn < RAIDZ_REC_NUM; fn++)
|
||||||
benchmark_raidz_impl(bench_rm, fn, benchmark_rec_impl);
|
benchmark_raidz_impl(bench_rm, fn, benchmark_rec_impl);
|
||||||
@ -444,9 +463,8 @@ vdev_raidz_math_init(void)
|
|||||||
}
|
}
|
||||||
|
|
||||||
/* Finish initialization */
|
/* Finish initialization */
|
||||||
|
atomic_swap_32(&zfs_vdev_raidz_impl, user_sel_impl);
|
||||||
raidz_math_initialized = B_TRUE;
|
raidz_math_initialized = B_TRUE;
|
||||||
if (!vdev_raidz_impl_user_set)
|
|
||||||
VERIFY0(vdev_raidz_impl_set("fastest"));
|
|
||||||
}
|
}
|
||||||
|
|
||||||
void
|
void
|
||||||
@ -460,33 +478,33 @@ vdev_raidz_math_fini(void)
|
|||||||
raidz_math_kstat = NULL;
|
raidz_math_kstat = NULL;
|
||||||
}
|
}
|
||||||
|
|
||||||
rw_destroy(&vdev_raidz_impl_lock);
|
|
||||||
|
|
||||||
/* fini impl */
|
/* fini impl */
|
||||||
for (i = 0; i < ARRAY_SIZE(raidz_all_maths); i++) {
|
for (i = 0; i < ARRAY_SIZE(raidz_all_maths); i++) {
|
||||||
curr_impl = raidz_all_maths[i];
|
curr_impl = raidz_all_maths[i];
|
||||||
|
|
||||||
if (curr_impl->fini)
|
if (curr_impl->fini)
|
||||||
curr_impl->fini();
|
curr_impl->fini();
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
static const
|
static const struct {
|
||||||
struct {
|
|
||||||
char *name;
|
char *name;
|
||||||
raidz_impl_ops_t *impl;
|
uint32_t sel;
|
||||||
enum vdev_raidz_impl_sel sel;
|
|
||||||
} math_impl_opts[] = {
|
} math_impl_opts[] = {
|
||||||
{ "fastest", &vdev_raidz_fastest_impl, IMPL_FASTEST },
|
|
||||||
{ "original", NULL, IMPL_ORIGINAL },
|
|
||||||
#if !defined(_KERNEL)
|
#if !defined(_KERNEL)
|
||||||
{ "cycle", NULL, IMPL_CYCLE },
|
{ "cycle", IMPL_CYCLE },
|
||||||
#endif
|
#endif
|
||||||
|
{ "fastest", IMPL_FASTEST },
|
||||||
|
{ "original", IMPL_ORIGINAL },
|
||||||
|
{ "scalar", IMPL_SCALAR }
|
||||||
};
|
};
|
||||||
|
|
||||||
/*
|
/*
|
||||||
* Function sets desired raidz implementation.
|
* Function sets desired raidz implementation.
|
||||||
* If called after module_init(), vdev_raidz_impl_lock must be held for writing.
|
*
|
||||||
|
* If we are called before init(), user preference will be saved in
|
||||||
|
* user_sel_impl, and applied in later init() call. This occurs when module
|
||||||
|
* parameter is specified on module load. Otherwise, directly update
|
||||||
|
* zfs_vdev_raidz_impl.
|
||||||
*
|
*
|
||||||
* @val Name of raidz implementation to use
|
* @val Name of raidz implementation to use
|
||||||
* @param Unused.
|
* @param Unused.
|
||||||
@ -494,42 +512,58 @@ struct {
|
|||||||
static int
|
static int
|
||||||
zfs_vdev_raidz_impl_set(const char *val, struct kernel_param *kp)
|
zfs_vdev_raidz_impl_set(const char *val, struct kernel_param *kp)
|
||||||
{
|
{
|
||||||
|
int err = -EINVAL;
|
||||||
|
char req_name[RAIDZ_IMPL_NAME_MAX];
|
||||||
|
uint32_t impl = RAIDZ_IMPL_READ(user_sel_impl);
|
||||||
size_t i;
|
size_t i;
|
||||||
|
|
||||||
|
/* sanitize input */
|
||||||
|
i = strnlen(val, RAIDZ_IMPL_NAME_MAX);
|
||||||
|
if (i == 0 || i == RAIDZ_IMPL_NAME_MAX)
|
||||||
|
return (err);
|
||||||
|
|
||||||
|
strlcpy(req_name, val, RAIDZ_IMPL_NAME_MAX);
|
||||||
|
while (i > 0 && !!isspace(req_name[i-1]))
|
||||||
|
i--;
|
||||||
|
req_name[i] = '\0';
|
||||||
|
|
||||||
/* Check mandatory options */
|
/* Check mandatory options */
|
||||||
for (i = 0; i < ARRAY_SIZE(math_impl_opts); i++) {
|
for (i = 0; i < ARRAY_SIZE(math_impl_opts); i++) {
|
||||||
if (strcmp(val, math_impl_opts[i].name) == 0) {
|
if (strcmp(req_name, math_impl_opts[i].name) == 0) {
|
||||||
zfs_vdev_raidz_impl = math_impl_opts[i].sel;
|
impl = math_impl_opts[i].sel;
|
||||||
vdev_raidz_used_impl = math_impl_opts[i].impl;
|
err = 0;
|
||||||
vdev_raidz_impl_user_set = B_TRUE;
|
break;
|
||||||
return (0);
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
/* check all supported impl if init() was already called */
|
||||||
|
if (err != 0 && raidz_math_initialized) {
|
||||||
/* check all supported implementations */
|
/* check all supported implementations */
|
||||||
for (i = 0; i < raidz_supp_impl_cnt; i++) {
|
for (i = 0; i < raidz_supp_impl_cnt; i++) {
|
||||||
if (strcmp(val, raidz_supp_impl[i]->name) == 0) {
|
if (strcmp(req_name, raidz_supp_impl[i]->name) == 0) {
|
||||||
zfs_vdev_raidz_impl = i;
|
impl = i;
|
||||||
vdev_raidz_used_impl = raidz_supp_impl[i];
|
err = 0;
|
||||||
vdev_raidz_impl_user_set = B_TRUE;
|
break;
|
||||||
return (0);
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
return (-EINVAL);
|
if (err == 0) {
|
||||||
|
if (raidz_math_initialized)
|
||||||
|
atomic_swap_32(&zfs_vdev_raidz_impl, impl);
|
||||||
|
else
|
||||||
|
atomic_swap_32(&user_sel_impl, impl);
|
||||||
|
}
|
||||||
|
|
||||||
|
return (err);
|
||||||
}
|
}
|
||||||
|
|
||||||
int
|
int
|
||||||
vdev_raidz_impl_set(const char *val)
|
vdev_raidz_impl_set(const char *val)
|
||||||
{
|
{
|
||||||
int err;
|
|
||||||
|
|
||||||
ASSERT(raidz_math_initialized);
|
ASSERT(raidz_math_initialized);
|
||||||
|
|
||||||
rw_enter(&vdev_raidz_impl_lock, RW_WRITER);
|
return (zfs_vdev_raidz_impl_set(val, NULL));
|
||||||
err = zfs_vdev_raidz_impl_set(val, NULL);
|
|
||||||
rw_exit(&vdev_raidz_impl_lock);
|
|
||||||
return (err);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
#if defined(_KERNEL) && defined(HAVE_SPL)
|
#if defined(_KERNEL) && defined(HAVE_SPL)
|
||||||
@ -538,29 +572,22 @@ zfs_vdev_raidz_impl_get(char *buffer, struct kernel_param *kp)
|
|||||||
{
|
{
|
||||||
int i, cnt = 0;
|
int i, cnt = 0;
|
||||||
char *fmt;
|
char *fmt;
|
||||||
|
const uint32_t impl = RAIDZ_IMPL_READ(zfs_vdev_raidz_impl);
|
||||||
|
|
||||||
ASSERT(raidz_math_initialized);
|
ASSERT(raidz_math_initialized);
|
||||||
|
|
||||||
rw_enter(&vdev_raidz_impl_lock, RW_READER);
|
|
||||||
|
|
||||||
/* list mandatory options */
|
/* list mandatory options */
|
||||||
for (i = 0; i < ARRAY_SIZE(math_impl_opts); i++) {
|
for (i = 0; i < ARRAY_SIZE(math_impl_opts) - 2; i++) {
|
||||||
if (math_impl_opts[i].sel == zfs_vdev_raidz_impl)
|
fmt = (impl == math_impl_opts[i].sel) ? "[%s] " : "%s ";
|
||||||
fmt = "[%s] ";
|
|
||||||
else
|
|
||||||
fmt = "%s ";
|
|
||||||
|
|
||||||
cnt += sprintf(buffer + cnt, fmt, math_impl_opts[i].name);
|
cnt += sprintf(buffer + cnt, fmt, math_impl_opts[i].name);
|
||||||
}
|
}
|
||||||
|
|
||||||
/* list all supported implementations */
|
/* list all supported implementations */
|
||||||
for (i = 0; i < raidz_supp_impl_cnt; i++) {
|
for (i = 0; i < raidz_supp_impl_cnt; i++) {
|
||||||
fmt = (i == zfs_vdev_raidz_impl) ? "[%s] " : "%s ";
|
fmt = (i == impl) ? "[%s] " : "%s ";
|
||||||
cnt += sprintf(buffer + cnt, fmt, raidz_supp_impl[i]->name);
|
cnt += sprintf(buffer + cnt, fmt, raidz_supp_impl[i]->name);
|
||||||
}
|
}
|
||||||
|
|
||||||
rw_exit(&vdev_raidz_impl_lock);
|
|
||||||
|
|
||||||
return (cnt);
|
return (cnt);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -47,10 +47,10 @@
|
|||||||
#define VR1(r...) VR1_(r)
|
#define VR1(r...) VR1_(r)
|
||||||
#define VR2(r...) VR2_(r, 1)
|
#define VR2(r...) VR2_(r, 1)
|
||||||
#define VR3(r...) VR3_(r, 1, 2)
|
#define VR3(r...) VR3_(r, 1, 2)
|
||||||
#define VR4(r...) VR4_(r, 1)
|
#define VR4(r...) VR4_(r, 1, 2)
|
||||||
#define VR5(r...) VR5_(r, 1, 2)
|
#define VR5(r...) VR5_(r, 1, 2, 3)
|
||||||
#define VR6(r...) VR6_(r, 1, 2, 3)
|
#define VR6(r...) VR6_(r, 1, 2, 3, 4)
|
||||||
#define VR7(r...) VR7_(r, 1, 2, 3, 4)
|
#define VR7(r...) VR7_(r, 1, 2, 3, 4, 5)
|
||||||
|
|
||||||
#define R_01(REG1, REG2, ...) REG1, REG2
|
#define R_01(REG1, REG2, ...) REG1, REG2
|
||||||
#define _R_23(_0, _1, REG2, REG3, ...) REG2, REG3
|
#define _R_23(_0, _1, REG2, REG3, ...) REG2, REG3
|
||||||
|
@ -222,7 +222,7 @@ static const struct {
|
|||||||
DEFINE_GEN_METHODS(scalar);
|
DEFINE_GEN_METHODS(scalar);
|
||||||
DEFINE_REC_METHODS(scalar);
|
DEFINE_REC_METHODS(scalar);
|
||||||
|
|
||||||
static boolean_t
|
boolean_t
|
||||||
raidz_will_scalar_work(void)
|
raidz_will_scalar_work(void)
|
||||||
{
|
{
|
||||||
return (B_TRUE); /* always */
|
return (B_TRUE); /* always */
|
||||||
|
@ -47,10 +47,10 @@
|
|||||||
#define VR1(r...) VR1_(r)
|
#define VR1(r...) VR1_(r)
|
||||||
#define VR2(r...) VR2_(r, 1)
|
#define VR2(r...) VR2_(r, 1)
|
||||||
#define VR3(r...) VR3_(r, 1, 2)
|
#define VR3(r...) VR3_(r, 1, 2)
|
||||||
#define VR4(r...) VR4_(r, 1)
|
#define VR4(r...) VR4_(r, 1, 2)
|
||||||
#define VR5(r...) VR5_(r, 1, 2)
|
#define VR5(r...) VR5_(r, 1, 2, 3)
|
||||||
#define VR6(r...) VR6_(r, 1, 2, 3)
|
#define VR6(r...) VR6_(r, 1, 2, 3, 4)
|
||||||
#define VR7(r...) VR7_(r, 1, 2, 3, 4)
|
#define VR7(r...) VR7_(r, 1, 2, 3, 4, 5)
|
||||||
|
|
||||||
#define R_01(REG1, REG2, ...) REG1, REG2
|
#define R_01(REG1, REG2, ...) REG1, REG2
|
||||||
#define _R_23(_0, _1, REG2, REG3, ...) REG2, REG3
|
#define _R_23(_0, _1, REG2, REG3, ...) REG2, REG3
|
||||||
|
Loading…
Reference in New Issue
Block a user