/src/zlib-ng/arch/x86/chunkset_sse2.c
Line | Count | Source |
1 | | /* chunkset_sse2.c -- SSE2 inline functions to copy small data chunks. |
2 | | * For conditions of distribution and use, see copyright notice in zlib.h |
3 | | */ |
4 | | |
5 | | #ifdef X86_SSE2 |
6 | | |
7 | | #include "zbuild.h" |
8 | | #include "zmemory.h" |
9 | | |
10 | | #include <immintrin.h> |
11 | | |
12 | | typedef __m128i chunk_t; |
13 | | |
14 | | #define HAVE_CHUNKMEMSET_2 |
15 | | #define HAVE_CHUNKMEMSET_4 |
16 | | #define HAVE_CHUNKMEMSET_8 |
17 | | |
18 | 0 | static inline void chunkmemset_2(uint8_t *from, chunk_t *chunk) { |
19 | 0 | *chunk = _mm_set1_epi16(zng_memread_2(from)); |
20 | 0 | } |
21 | | |
22 | 0 | static inline void chunkmemset_4(uint8_t *from, chunk_t *chunk) { |
23 | 0 | *chunk = _mm_set1_epi32(zng_memread_4(from)); |
24 | 0 | } |
25 | | |
26 | 0 | static inline void chunkmemset_8(uint8_t *from, chunk_t *chunk) { |
27 | 0 | *chunk = _mm_set1_epi64x(zng_memread_8(from)); |
28 | 0 | } |
29 | | |
30 | 0 | static inline void loadchunk(uint8_t const *s, chunk_t *chunk) { |
31 | 0 | *chunk = _mm_loadu_si128((__m128i *)s); |
32 | 0 | } |
33 | | |
34 | 0 | static inline void storechunk(uint8_t *out, chunk_t *chunk) { |
35 | 0 | _mm_storeu_si128((__m128i *)out, *chunk); |
36 | 0 | } |
37 | | |
38 | | #define CHUNKSIZE chunksize_sse2 |
39 | 0 | #define CHUNKCOPY chunkcopy_sse2 |
40 | 0 | #define CHUNKUNROLL chunkunroll_sse2 |
41 | 0 | #define CHUNKMEMSET chunkmemset_sse2 |
42 | | #define CHUNKMEMSET_SAFE chunkmemset_safe_sse2 |
43 | | |
44 | | #include "chunkset_tpl.h" |
45 | | |
46 | | #define INFLATE_FAST inflate_fast_sse2 |
47 | | |
48 | | #include "inffast_tpl.h" |
49 | | |
50 | | #endif |