1 /*-------------------------------------------------------------------------
4 * Compute CRC-32C checksum using Intel SSE 4.2 instructions.
6 * Portions Copyright (c) 1996-2023, PostgreSQL Global Development Group
7 * Portions Copyright (c) 1994, Regents of the University of California
11 * src/port/pg_crc32c_sse42.c
13 *-------------------------------------------------------------------------
17 #include <nmmintrin.h>
19 #include "port/pg_crc32c.h"
21 pg_attribute_no_sanitize_alignment()
23 pg_comp_crc32c_sse42(pg_crc32c crc
, const void *data
, size_t len
)
25 const unsigned char *p
= data
;
26 const unsigned char *pend
= p
+ len
;
29 * Process eight bytes of data at a time.
31 * NB: We do unaligned accesses here. The Intel architecture allows that,
32 * and performance testing didn't show any performance gain from aligning
38 crc
= (uint32
) _mm_crc32_u64(crc
, *((const uint64
*) p
));
42 /* Process remaining full four bytes if any */
45 crc
= _mm_crc32_u32(crc
, *((const unsigned int *) p
));
51 * Process four bytes at a time. (The eight byte instruction is not
52 * available on the 32-bit x86 architecture).
56 crc
= _mm_crc32_u32(crc
, *((const unsigned int *) p
));
59 #endif /* __x86_64__ */
61 /* Process any remaining bytes one at a time. */
64 crc
= _mm_crc32_u8(crc
, *p
);