1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128
|
#ifndef AWS_CHECKSUMS_PRIVATE_CRC_UTIL_H
#define AWS_CHECKSUMS_PRIVATE_CRC_UTIL_H
/**
* Copyright Amazon.com, Inc. or its affiliates. All Rights Reserved.
* SPDX-License-Identifier: Apache-2.0.
*/
#include <aws/common/byte_order.h>
#include <aws/common/cpuid.h>
#include <aws/common/stdint.h>
#include <limits.h>
#include <stdlib.h>
#define large_buffer_apply_impl(Name, T) \
static T aws_large_buffer_apply_##Name( \
T (*checksum_fn)(const uint8_t *, int, T), const uint8_t *buffer, size_t length, T previous) { \
T val = previous; \
while (length > INT_MAX) { \
val = checksum_fn(buffer, INT_MAX, val); \
buffer += (size_t)INT_MAX; \
length -= (size_t)INT_MAX; \
} \
val = checksum_fn(buffer, (int)length, val); \
return val; \
}
/* helper function to reverse byte order on big-endian platforms*/
static inline uint32_t aws_bswap32_if_be(uint32_t x) {
if (!aws_is_big_endian()) {
return x;
}
#if _MSC_VER
return _byteswap_ulong(x);
#elif defined(__GNUC__) && (__GNUC__ > 4 || (__GNUC__ == 4 && __GNUC_MINOR__ >= 8))
return __builtin_bswap32(x);
#elif defined(__clang__) && __clang_major__ >= 3
return __builtin_bswap32(x);
#else
return (
((x & 0xff000000u) >> 24) | ((x & 0x00ff0000u) >> 8) | ((x & 0x0000ff00u) << 8) | ((x & 0x000000ffu) << 24));
#endif
}
/* Reverse the bytes in a 64-bit word. */
static inline uint64_t aws_bswap64_if_be(uint64_t x) {
if (!aws_is_big_endian()) {
return x;
}
#if _MSC_VER
return _byteswap_uint64(x);
#elif defined(__GNUC__) && (__GNUC__ > 4 || (__GNUC__ == 4 && __GNUC_MINOR__ >= 8))
/* Note: gcc supports it starting with 4.2. here its just picking the lowest version we run test on. */
return __builtin_bswap64(x);
#elif defined(__clang__) && __clang_major__ >= 3
return __builtin_bswap64(x);
#else
return ((x << 56) & 0xff00000000000000ULL) | ((x << 40) & 0x00ff000000000000ULL) |
((x << 24) & 0x0000ff0000000000ULL) | ((x << 8) & 0x000000ff00000000ULL) |
((x >> 8) & 0x00000000ff000000ULL) | ((x >> 24) & 0x0000000000ff0000ULL) |
((x >> 40) & 0x000000000000ff00ULL) | ((x >> 56) & 0x00000000000000ffULL);
#endif
}
/**
* Force resolution of any global variables for CRC32.
* Note: in usual flow those are resolved on the first call to crc32 functions, which
* which might be deemed non-thread safe by some tools.
*/
void aws_checksums_crc32_init(void);
/**
* Force resolution of any global variables for CRC64.
* Note: in usual flow those are resolved on the first call to crc64 functions, which
* which might be deemed non-thread safe by some tools.
*/
void aws_checksums_crc64_init(void);
/**
* Note: this is slightly different from our typical pattern.
* This check is currently performed in a tight loop, so jumping through
* some hoops with inlining to avoid perf regressions, which forces
* below functions to be declared in a header.
*/
extern bool s_detection_performed;
extern bool s_detected_sse42;
extern bool s_detected_avx512;
extern bool s_detected_clmul;
extern bool s_detected_vpclmulqdq;
static inline void aws_checksums_init_detection_cache(void) {
s_detected_clmul = aws_cpu_has_feature(AWS_CPU_FEATURE_CLMUL);
s_detected_sse42 = aws_cpu_has_feature(AWS_CPU_FEATURE_SSE_4_2);
s_detected_avx512 = aws_cpu_has_feature(AWS_CPU_FEATURE_AVX512);
s_detected_clmul = aws_cpu_has_feature(AWS_CPU_FEATURE_CLMUL);
s_detected_vpclmulqdq = aws_cpu_has_feature(AWS_CPU_FEATURE_VPCLMULQDQ);
}
static inline bool aws_cpu_has_clmul_cached(void) {
if (AWS_UNLIKELY(!s_detection_performed)) {
aws_checksums_init_detection_cache();
}
return s_detected_clmul;
}
static inline bool aws_cpu_has_sse42_cached(void) {
if (AWS_UNLIKELY(!s_detection_performed)) {
aws_checksums_init_detection_cache();
}
return s_detected_sse42;
}
static inline bool aws_cpu_has_avx512_cached(void) {
if (AWS_UNLIKELY(!s_detection_performed)) {
aws_checksums_init_detection_cache();
}
return s_detected_avx512;
}
static inline bool aws_cpu_has_vpclmulqdq_cached(void) {
if (AWS_UNLIKELY(!s_detection_performed)) {
aws_checksums_init_detection_cache();
}
return s_detected_vpclmulqdq;
}
#endif /* AWS_CHECKSUMS_PRIVATE_CRC_UTIL_H */
|