mirror of
				https://git.proxmox.com/git/mirror_zfs
				synced 2025-10-25 16:24:29 +00:00 
			
		
		
		
	 0ad5f43442
			
		
	
	
		0ad5f43442
		
			
		
	
	
	
	
		
			
			This is probably the uncontroversial part of #13631, which fixes a real problem people are having. There's still things to improve in our code after this is merged, but it should stop the breakage that people have reported, where we lie about a type always being aligned and then pass in stack objects with no alignment requirement and hope for the best. Of course, our SIMD code was written with unaligned accesses, so it doesn't care if we drop this...but some auto-vectorized code that gcc emits sure does, since we told it it can assume they're aligned. Reviewed-by: Brian Behlendorf <behlendorf1@llnl.gov> Reviewed-by: Tino Reichardt <milky-zfs@mcmilk.de> Reviewed-by: Richard Yao <richard.yao@alumni.stonybrook.edu> Signed-off-by: Rich Ercolani <rincebrain@gmail.com> Closes #14649
		
			
				
	
	
		
			165 lines
		
	
	
		
			5.0 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			165 lines
		
	
	
		
			5.0 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| /*
 | |
|  * CDDL HEADER START
 | |
|  *
 | |
|  * The contents of this file are subject to the terms of the
 | |
|  * Common Development and Distribution License (the "License").
 | |
|  * You may not use this file except in compliance with the License.
 | |
|  *
 | |
|  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
 | |
|  * or https://opensource.org/licenses/CDDL-1.0.
 | |
|  * See the License for the specific language governing permissions
 | |
|  * and limitations under the License.
 | |
|  *
 | |
|  * When distributing Covered Code, include this CDDL HEADER in each
 | |
|  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
 | |
|  * If applicable, add the following below this CDDL HEADER, with the
 | |
|  * fields enclosed by brackets "[]" replaced with your own identifying
 | |
|  * information: Portions Copyright [yyyy] [name of copyright owner]
 | |
|  *
 | |
|  * CDDL HEADER END
 | |
|  */
 | |
| /*
 | |
|  * Copyright 2009 Sun Microsystems, Inc.  All rights reserved.
 | |
|  * Use is subject to license terms.
 | |
|  */
 | |
| /*
 | |
|  * Copyright 2013 Saso Kiselkov. All rights reserved.
 | |
|  */
 | |
| 
 | |
| #ifndef	_ZFS_FLETCHER_H
 | |
| #define	_ZFS_FLETCHER_H extern __attribute__((visibility("default")))
 | |
| 
 | |
| #include <sys/types.h>
 | |
| #include <sys/spa_checksum.h>
 | |
| 
 | |
| #ifdef	__cplusplus
 | |
| extern "C" {
 | |
| #endif
 | |
| 
 | |
| /*
 | |
|  * fletcher checksum functions
 | |
|  *
 | |
|  * Note: Fletcher checksum methods expect buffer size to be 4B aligned. This
 | |
|  * limitation stems from the algorithm design. Performing incremental checksum
 | |
|  * without said alignment would yield different results. Therefore, the code
 | |
|  * includes assertions for the size alignment.
 | |
|  * For compatibility, it is required that some code paths calculate checksum of
 | |
|  * non-aligned buffer sizes. For this purpose, `fletcher_4_native_varsize()`
 | |
|  * checksum method is added. This method will ignore last (size % 4) bytes of
 | |
|  * the data buffer.
 | |
|  */
 | |
| _ZFS_FLETCHER_H void fletcher_init(zio_cksum_t *);
 | |
| _ZFS_FLETCHER_H void fletcher_2_native(const void *, uint64_t, const void *,
 | |
|     zio_cksum_t *);
 | |
| _ZFS_FLETCHER_H void fletcher_2_byteswap(const void *, uint64_t, const void *,
 | |
|     zio_cksum_t *);
 | |
| _ZFS_FLETCHER_H void fletcher_4_native(const void *, uint64_t, const void *,
 | |
|     zio_cksum_t *);
 | |
| _ZFS_FLETCHER_H int fletcher_2_incremental_native(void *, size_t, void *);
 | |
| _ZFS_FLETCHER_H int fletcher_2_incremental_byteswap(void *, size_t, void *);
 | |
| _ZFS_FLETCHER_H void fletcher_4_native_varsize(const void *, uint64_t,
 | |
|     zio_cksum_t *);
 | |
| _ZFS_FLETCHER_H void fletcher_4_byteswap(const void *, uint64_t, const void *,
 | |
|     zio_cksum_t *);
 | |
| _ZFS_FLETCHER_H int fletcher_4_incremental_native(void *, size_t, void *);
 | |
| _ZFS_FLETCHER_H int fletcher_4_incremental_byteswap(void *, size_t, void *);
 | |
| _ZFS_FLETCHER_H int fletcher_4_impl_set(const char *selector);
 | |
| _ZFS_FLETCHER_H void fletcher_4_init(void);
 | |
| _ZFS_FLETCHER_H void fletcher_4_fini(void);
 | |
| 
 | |
| 
 | |
| 
 | |
| /* Internal fletcher ctx */
 | |
| 
 | |
| typedef struct zfs_fletcher_superscalar {
 | |
| 	uint64_t v[4];
 | |
| } zfs_fletcher_superscalar_t;
 | |
| 
 | |
| typedef struct zfs_fletcher_sse {
 | |
| 	uint64_t v[2];
 | |
| } zfs_fletcher_sse_t;
 | |
| 
 | |
| typedef struct zfs_fletcher_avx {
 | |
| 	uint64_t v[4];
 | |
| } zfs_fletcher_avx_t;
 | |
| 
 | |
| typedef struct zfs_fletcher_avx512 {
 | |
| 	uint64_t v[8];
 | |
| } zfs_fletcher_avx512_t;
 | |
| 
 | |
| typedef struct zfs_fletcher_aarch64_neon {
 | |
| 	uint64_t v[2];
 | |
| } zfs_fletcher_aarch64_neon_t;
 | |
| 
 | |
| 
 | |
| typedef union fletcher_4_ctx {
 | |
| 	zio_cksum_t scalar;
 | |
| 	zfs_fletcher_superscalar_t superscalar[4];
 | |
| 
 | |
| #if defined(HAVE_SSE2) || (defined(HAVE_SSE2) && defined(HAVE_SSSE3))
 | |
| 	zfs_fletcher_sse_t sse[4];
 | |
| #endif
 | |
| #if defined(HAVE_AVX) && defined(HAVE_AVX2)
 | |
| 	zfs_fletcher_avx_t avx[4];
 | |
| #endif
 | |
| #if defined(__x86_64) && defined(HAVE_AVX512F)
 | |
| 	zfs_fletcher_avx512_t avx512[4];
 | |
| #endif
 | |
| #if defined(__aarch64__)
 | |
| 	zfs_fletcher_aarch64_neon_t aarch64_neon[4];
 | |
| #endif
 | |
| } fletcher_4_ctx_t;
 | |
| 
 | |
| /*
 | |
|  * fletcher checksum struct
 | |
|  */
 | |
| typedef void (*fletcher_4_init_f)(fletcher_4_ctx_t *);
 | |
| typedef void (*fletcher_4_fini_f)(fletcher_4_ctx_t *, zio_cksum_t *);
 | |
| typedef void (*fletcher_4_compute_f)(fletcher_4_ctx_t *,
 | |
|     const void *, uint64_t);
 | |
| 
 | |
| typedef struct fletcher_4_func {
 | |
| 	fletcher_4_init_f init_native;
 | |
| 	fletcher_4_fini_f fini_native;
 | |
| 	fletcher_4_compute_f compute_native;
 | |
| 	fletcher_4_init_f init_byteswap;
 | |
| 	fletcher_4_fini_f fini_byteswap;
 | |
| 	fletcher_4_compute_f compute_byteswap;
 | |
| 	boolean_t (*valid)(void);
 | |
| 	boolean_t uses_fpu;
 | |
| 	const char *name;
 | |
| } __attribute__((aligned(64))) fletcher_4_ops_t;
 | |
| 
 | |
| _ZFS_FLETCHER_H const fletcher_4_ops_t fletcher_4_superscalar_ops;
 | |
| _ZFS_FLETCHER_H const fletcher_4_ops_t fletcher_4_superscalar4_ops;
 | |
| 
 | |
| #if defined(HAVE_SSE2)
 | |
| _ZFS_FLETCHER_H const fletcher_4_ops_t fletcher_4_sse2_ops;
 | |
| #endif
 | |
| 
 | |
| #if defined(HAVE_SSE2) && defined(HAVE_SSSE3)
 | |
| _ZFS_FLETCHER_H const fletcher_4_ops_t fletcher_4_ssse3_ops;
 | |
| #endif
 | |
| 
 | |
| #if defined(HAVE_AVX) && defined(HAVE_AVX2)
 | |
| _ZFS_FLETCHER_H const fletcher_4_ops_t fletcher_4_avx2_ops;
 | |
| #endif
 | |
| 
 | |
| #if defined(__x86_64) && defined(HAVE_AVX512F)
 | |
| _ZFS_FLETCHER_H const fletcher_4_ops_t fletcher_4_avx512f_ops;
 | |
| #endif
 | |
| 
 | |
| #if defined(__x86_64) && defined(HAVE_AVX512BW)
 | |
| _ZFS_FLETCHER_H const fletcher_4_ops_t fletcher_4_avx512bw_ops;
 | |
| #endif
 | |
| 
 | |
| #if defined(__aarch64__)
 | |
| _ZFS_FLETCHER_H const fletcher_4_ops_t fletcher_4_aarch64_neon_ops;
 | |
| #endif
 | |
| 
 | |
| #ifdef	__cplusplus
 | |
| }
 | |
| #endif
 | |
| 
 | |
| #endif	/* _ZFS_FLETCHER_H */
 |