diff options
| author | Cameron Cawley <ccawley2011@gmail.com> | 2024-02-22 12:09:51 +0000 |
|---|---|---|
| committer | Hans Kristian Rosbach <hk-github@circlestorm.org> | 2024-02-22 20:20:42 +0100 |
| commit | d745a9bc24e523853de36a4206d8e04acd3c67c7 (patch) | |
| tree | 2db252d05a7cf5dc4d5b9618f463986c7db88be6 | |
| parent | 49b7760d7a3cbedab4bfcfc5505ad13bfe4bc16a (diff) | |
| download | Project-Tick-d745a9bc24e523853de36a4206d8e04acd3c67c7.tar.gz Project-Tick-d745a9bc24e523853de36a4206d8e04acd3c67c7.zip | |
Remove mixing of SSE2 and SSSE3 chunkset code
| -rw-r--r-- | arch/x86/chunkset_ssse3.c | 12 |
1 file changed, 2 insertions, 10 deletions
```diff
diff --git a/arch/x86/chunkset_ssse3.c b/arch/x86/chunkset_ssse3.c
index 7ff16a4f65..722ecd3d51 100644
--- a/arch/x86/chunkset_ssse3.c
+++ b/arch/x86/chunkset_ssse3.c
@@ -4,9 +4,6 @@
 
 #include "zbuild.h"
 
-/* This requires SSE2 support. While it's implicit with SSSE3, we can minimize
- * code size by sharing the chunkcopy functions, which will certainly compile
- * to identical machine code */
 #if defined(X86_SSSE3)
 #include <immintrin.h>
 #include "../generic/chunk_permute_table.h"
@@ -19,8 +16,6 @@ typedef __m128i chunk_t;
 #define HAVE_CHUNKMEMSET_4
 #define HAVE_CHUNKMEMSET_8
 #define HAVE_CHUNK_MAG
-#define HAVE_CHUNKCOPY
-#define HAVE_CHUNKUNROLL
 
 static const lut_rem_pair perm_idx_lut[13] = {
     {0, 1}, /* 3 */
@@ -83,14 +78,11 @@ static inline chunk_t GET_CHUNK_MAG(uint8_t *buf, uint32_t *chunk_rem, uint32_t
     return ret_vec;
 }
 
-extern uint8_t* chunkcopy_sse2(uint8_t *out, uint8_t const *from, unsigned len);
-extern uint8_t* chunkunroll_sse2(uint8_t *out, unsigned *dist, unsigned *len);
-
 #define CHUNKSIZE chunksize_ssse3
 #define CHUNKMEMSET chunkmemset_ssse3
 #define CHUNKMEMSET_SAFE chunkmemset_safe_ssse3
-#define CHUNKCOPY chunkcopy_sse2
-#define CHUNKUNROLL chunkunroll_sse2
+#define CHUNKCOPY chunkcopy_ssse3
+#define CHUNKUNROLL chunkunroll_ssse3
 
 #include "chunkset_tpl.h"
 
```
