mirror of
https://git.proxmox.com/git/mirror_zfs.git
synced 2025-01-04 23:39:33 +03:00
78289b8458
Currently calls to kfpu_begin() and kfpu_end() are split between the init() and fini() functions of the particular SIMD implementation. This was done in #14247 as an optimization measure for the ABD adapter. Unfortunately the split complicates FPU handling on platforms that use a local FPU state buffer, like Windows and macOS. To ease porting, we introduce a boolean struct member in fletcher_4_ops_t, indicating use of the FPU, and move the FPU state handling from the SIMD implementations to the call sites. Reviewed-by: Tino Reichardt <milky-zfs@mcmilk.de> Reviewed-by: Richard Yao <richard.yao@alumni.stonybrook.edu> Reviewed-by: Jorgen Lundman <lundman@lundman.net> Signed-off-by: Attila Fülöp <attila@fueloep.org> Closes #14600
181 lines
5.7 KiB
C
181 lines
5.7 KiB
C
/*
|
|
* CDDL HEADER START
|
|
*
|
|
* The contents of this file are subject to the terms of the
|
|
* Common Development and Distribution License (the "License").
|
|
* You may not use this file except in compliance with the License.
|
|
*
|
|
* You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
|
|
* or https://opensource.org/licenses/CDDL-1.0.
|
|
* See the License for the specific language governing permissions
|
|
* and limitations under the License.
|
|
*
|
|
* When distributing Covered Code, include this CDDL HEADER in each
|
|
* file and include the License file at usr/src/OPENSOLARIS.LICENSE.
|
|
* If applicable, add the following below this CDDL HEADER, with the
|
|
* fields enclosed by brackets "[]" replaced with your own identifying
|
|
* information: Portions Copyright [yyyy] [name of copyright owner]
|
|
*
|
|
* CDDL HEADER END
|
|
*/
|
|
/*
|
|
* Copyright 2009 Sun Microsystems, Inc. All rights reserved.
|
|
* Use is subject to license terms.
|
|
*/
|
|
/*
|
|
* Copyright 2013 Saso Kiselkov. All rights reserved.
|
|
*/
|
|
|
|
#ifndef _ZFS_FLETCHER_H
|
|
#define _ZFS_FLETCHER_H extern __attribute__((visibility("default")))
|
|
|
|
#include <sys/types.h>
|
|
#include <sys/spa_checksum.h>
|
|
|
|
#ifdef __cplusplus
|
|
extern "C" {
|
|
#endif
|
|
|
|
/*
|
|
* fletcher checksum functions
|
|
*
|
|
* Note: Fletcher checksum methods expect buffer size to be 4B aligned. This
|
|
* limitation stems from the algorithm design. Performing incremental checksum
|
|
* without said alignment would yield different results. Therefore, the code
|
|
* includes assertions for the size alignment.
|
|
* For compatibility, it is required that some code paths calculate checksum of
|
|
* non-aligned buffer sizes. For this purpose, `fletcher_4_native_varsize()`
|
|
* checksum method is added. This method will ignore last (size % 4) bytes of
|
|
* the data buffer.
|
|
*/
|
|
_ZFS_FLETCHER_H void fletcher_init(zio_cksum_t *);
|
|
_ZFS_FLETCHER_H void fletcher_2_native(const void *, uint64_t, const void *,
|
|
zio_cksum_t *);
|
|
_ZFS_FLETCHER_H void fletcher_2_byteswap(const void *, uint64_t, const void *,
|
|
zio_cksum_t *);
|
|
_ZFS_FLETCHER_H void fletcher_4_native(const void *, uint64_t, const void *,
|
|
zio_cksum_t *);
|
|
_ZFS_FLETCHER_H int fletcher_2_incremental_native(void *, size_t, void *);
|
|
_ZFS_FLETCHER_H int fletcher_2_incremental_byteswap(void *, size_t, void *);
|
|
_ZFS_FLETCHER_H void fletcher_4_native_varsize(const void *, uint64_t,
|
|
zio_cksum_t *);
|
|
_ZFS_FLETCHER_H void fletcher_4_byteswap(const void *, uint64_t, const void *,
|
|
zio_cksum_t *);
|
|
_ZFS_FLETCHER_H int fletcher_4_incremental_native(void *, size_t, void *);
|
|
_ZFS_FLETCHER_H int fletcher_4_incremental_byteswap(void *, size_t, void *);
|
|
_ZFS_FLETCHER_H int fletcher_4_impl_set(const char *selector);
|
|
_ZFS_FLETCHER_H void fletcher_4_init(void);
|
|
_ZFS_FLETCHER_H void fletcher_4_fini(void);
|
|
|
|
|
|
|
|
/* Internal fletcher ctx */
|
|
|
|
typedef struct zfs_fletcher_superscalar {
|
|
uint64_t v[4];
|
|
} zfs_fletcher_superscalar_t;
|
|
|
|
typedef struct zfs_fletcher_sse {
|
|
uint64_t v[2] __attribute__((aligned(16)));
|
|
} zfs_fletcher_sse_t;
|
|
|
|
typedef struct zfs_fletcher_avx {
|
|
uint64_t v[4] __attribute__((aligned(32)));
|
|
} zfs_fletcher_avx_t;
|
|
|
|
typedef struct zfs_fletcher_avx512 {
|
|
uint64_t v[8] __attribute__((aligned(64)));
|
|
} zfs_fletcher_avx512_t;
|
|
|
|
typedef struct zfs_fletcher_aarch64_neon {
|
|
uint64_t v[2] __attribute__((aligned(16)));
|
|
} zfs_fletcher_aarch64_neon_t;
|
|
|
|
|
|
typedef union fletcher_4_ctx {
|
|
zio_cksum_t scalar;
|
|
zfs_fletcher_superscalar_t superscalar[4];
|
|
|
|
#if defined(HAVE_SSE2) || (defined(HAVE_SSE2) && defined(HAVE_SSSE3))
|
|
zfs_fletcher_sse_t sse[4];
|
|
#endif
|
|
#if defined(HAVE_AVX) && defined(HAVE_AVX2)
|
|
zfs_fletcher_avx_t avx[4];
|
|
#endif
|
|
#if defined(__x86_64) && defined(HAVE_AVX512F)
|
|
zfs_fletcher_avx512_t avx512[4];
|
|
#endif
|
|
#if defined(__aarch64__)
|
|
zfs_fletcher_aarch64_neon_t aarch64_neon[4];
|
|
#endif
|
|
} fletcher_4_ctx_t;
|
|
|
|
/*
|
|
* fletcher checksum struct
|
|
*/
|
|
typedef void (*fletcher_4_init_f)(fletcher_4_ctx_t *);
|
|
typedef void (*fletcher_4_fini_f)(fletcher_4_ctx_t *, zio_cksum_t *);
|
|
typedef void (*fletcher_4_compute_f)(fletcher_4_ctx_t *,
|
|
const void *, uint64_t);
|
|
|
|
typedef struct fletcher_4_func {
|
|
fletcher_4_init_f init_native;
|
|
fletcher_4_fini_f fini_native;
|
|
fletcher_4_compute_f compute_native;
|
|
fletcher_4_init_f init_byteswap;
|
|
fletcher_4_fini_f fini_byteswap;
|
|
fletcher_4_compute_f compute_byteswap;
|
|
boolean_t (*valid)(void);
|
|
boolean_t uses_fpu;
|
|
const char *name;
|
|
} __attribute__((aligned(64))) fletcher_4_ops_t;
|
|
|
|
_ZFS_FLETCHER_H const fletcher_4_ops_t fletcher_4_superscalar_ops;
|
|
_ZFS_FLETCHER_H const fletcher_4_ops_t fletcher_4_superscalar4_ops;
|
|
|
|
#if defined(HAVE_SSE2)
|
|
_ZFS_FLETCHER_H const fletcher_4_ops_t fletcher_4_sse2_ops;
|
|
#endif
|
|
|
|
#if defined(HAVE_SSE2) && defined(HAVE_SSSE3)
|
|
_ZFS_FLETCHER_H const fletcher_4_ops_t fletcher_4_ssse3_ops;
|
|
#endif
|
|
|
|
#if defined(HAVE_AVX) && defined(HAVE_AVX2)
|
|
_ZFS_FLETCHER_H const fletcher_4_ops_t fletcher_4_avx2_ops;
|
|
#endif
|
|
|
|
#if defined(__x86_64) && defined(HAVE_AVX512F)
|
|
_ZFS_FLETCHER_H const fletcher_4_ops_t fletcher_4_avx512f_ops;
|
|
#endif
|
|
|
|
#if defined(__x86_64) && defined(HAVE_AVX512BW)
|
|
_ZFS_FLETCHER_H const fletcher_4_ops_t fletcher_4_avx512bw_ops;
|
|
#endif
|
|
|
|
#if defined(__aarch64__)
|
|
_ZFS_FLETCHER_H const fletcher_4_ops_t fletcher_4_aarch64_neon_ops;
|
|
#endif
|
|
|
|
#ifdef __cplusplus
|
|
}
|
|
#endif
|
|
|
|
#if defined(ZFS_UBSAN_ENABLED)
|
|
#if defined(__has_attribute)
|
|
#if __has_attribute(no_sanitize_undefined)
|
|
#define ZFS_NO_SANITIZE_UNDEFINED __attribute__((no_sanitize_undefined))
|
|
#elif __has_attribute(no_sanitize)
|
|
#define ZFS_NO_SANITIZE_UNDEFINED __attribute__((no_sanitize("undefined")))
|
|
#else
|
|
#error "Compiler has to support attribute "
|
|
"`no_sanitize_undefined` or `no_sanitize(\"undefined\")`"
|
|
"when compiling with UBSan enabled"
|
|
#endif /* __has_attribute(no_sanitize_undefined) */
|
|
#endif /* defined(__has_attribute) */
|
|
#else
|
|
#define ZFS_NO_SANITIZE_UNDEFINED
|
|
#endif /* defined(ZFS_UBSAN_ENABLED) */
|
|
|
|
#endif /* _ZFS_FLETCHER_H */
|