|  | /* compare256.c -- 256 byte memory comparison with match length return | 
|  | * Copyright (C) 2020 Nathan Moinvaziri | 
|  | * For conditions of distribution and use, see copyright notice in zlib.h | 
|  | */ | 
|  |  | 
|  | #include "zbuild.h" | 
|  | #include "fallback_builtins.h" | 
|  |  | 
|  | /* ALIGNED, byte comparison */ | 
|  | static inline uint32_t compare256_c_static(const uint8_t *src0, const uint8_t *src1) { | 
|  | uint32_t len = 0; | 
|  |  | 
|  | do { | 
|  | if (*src0 != *src1) | 
|  | return len; | 
|  | src0 += 1, src1 += 1, len += 1; | 
|  | if (*src0 != *src1) | 
|  | return len; | 
|  | src0 += 1, src1 += 1, len += 1; | 
|  | if (*src0 != *src1) | 
|  | return len; | 
|  | src0 += 1, src1 += 1, len += 1; | 
|  | if (*src0 != *src1) | 
|  | return len; | 
|  | src0 += 1, src1 += 1, len += 1; | 
|  | if (*src0 != *src1) | 
|  | return len; | 
|  | src0 += 1, src1 += 1, len += 1; | 
|  | if (*src0 != *src1) | 
|  | return len; | 
|  | src0 += 1, src1 += 1, len += 1; | 
|  | if (*src0 != *src1) | 
|  | return len; | 
|  | src0 += 1, src1 += 1, len += 1; | 
|  | if (*src0 != *src1) | 
|  | return len; | 
|  | src0 += 1, src1 += 1, len += 1; | 
|  | } while (len < 256); | 
|  |  | 
|  | return 256; | 
|  | } | 
|  |  | 
|  | Z_INTERNAL uint32_t compare256_c(const uint8_t *src0, const uint8_t *src1) { | 
|  | return compare256_c_static(src0, src1); | 
|  | } | 
|  |  | 
|  | #define LONGEST_MATCH       longest_match_c | 
|  | #define COMPARE256          compare256_c_static | 
|  |  | 
|  | #include "match_tpl.h" | 
|  |  | 
|  | #define LONGEST_MATCH_SLOW | 
|  | #define LONGEST_MATCH       longest_match_slow_c | 
|  | #define COMPARE256          compare256_c_static | 
|  |  | 
|  | #include "match_tpl.h" | 
|  |  | 
|  | #ifdef UNALIGNED_OK | 
|  | /* 16-bit unaligned integer comparison */ | 
|  | static inline uint32_t compare256_unaligned_16_static(const uint8_t *src0, const uint8_t *src1) { | 
|  | uint32_t len = 0; | 
|  |  | 
|  | do { | 
|  | if (zmemcmp_2(src0, src1) != 0) | 
|  | return len + (*src0 == *src1); | 
|  | src0 += 2, src1 += 2, len += 2; | 
|  | if (zmemcmp_2(src0, src1) != 0) | 
|  | return len + (*src0 == *src1); | 
|  | src0 += 2, src1 += 2, len += 2; | 
|  | if (zmemcmp_2(src0, src1) != 0) | 
|  | return len + (*src0 == *src1); | 
|  | src0 += 2, src1 += 2, len += 2; | 
|  | if (zmemcmp_2(src0, src1) != 0) | 
|  | return len + (*src0 == *src1); | 
|  | src0 += 2, src1 += 2, len += 2; | 
|  | } while (len < 256); | 
|  |  | 
|  | return 256; | 
|  | } | 
|  |  | 
|  | Z_INTERNAL uint32_t compare256_unaligned_16(const uint8_t *src0, const uint8_t *src1) { | 
|  | return compare256_unaligned_16_static(src0, src1); | 
|  | } | 
|  |  | 
|  | #define LONGEST_MATCH       longest_match_unaligned_16 | 
|  | #define COMPARE256          compare256_unaligned_16_static | 
|  |  | 
|  | #include "match_tpl.h" | 
|  |  | 
|  | #define LONGEST_MATCH_SLOW | 
|  | #define LONGEST_MATCH       longest_match_slow_unaligned_16 | 
|  | #define COMPARE256          compare256_unaligned_16_static | 
|  |  | 
|  | #include "match_tpl.h" | 
|  |  | 
|  | #ifdef HAVE_BUILTIN_CTZ | 
|  | /* 32-bit unaligned integer comparison */ | 
|  | static inline uint32_t compare256_unaligned_32_static(const uint8_t *src0, const uint8_t *src1) { | 
|  | uint32_t len = 0; | 
|  |  | 
|  | do { | 
|  | uint32_t sv, mv, diff; | 
|  |  | 
|  | zmemcpy_4(&sv, src0); | 
|  | zmemcpy_4(&mv, src1); | 
|  |  | 
|  | diff = sv ^ mv; | 
|  | if (diff) { | 
|  | uint32_t match_byte = __builtin_ctz(diff) / 8; | 
|  | return len + match_byte; | 
|  | } | 
|  |  | 
|  | src0 += 4, src1 += 4, len += 4; | 
|  | } while (len < 256); | 
|  |  | 
|  | return 256; | 
|  | } | 
|  |  | 
|  | Z_INTERNAL uint32_t compare256_unaligned_32(const uint8_t *src0, const uint8_t *src1) { | 
|  | return compare256_unaligned_32_static(src0, src1); | 
|  | } | 
|  |  | 
|  | #define LONGEST_MATCH       longest_match_unaligned_32 | 
|  | #define COMPARE256          compare256_unaligned_32_static | 
|  |  | 
|  | #include "match_tpl.h" | 
|  |  | 
|  | #define LONGEST_MATCH_SLOW | 
|  | #define LONGEST_MATCH       longest_match_slow_unaligned_32 | 
|  | #define COMPARE256          compare256_unaligned_32_static | 
|  |  | 
|  | #include "match_tpl.h" | 
|  |  | 
|  | #endif | 
|  |  | 
|  | #if defined(UNALIGNED64_OK) && defined(HAVE_BUILTIN_CTZLL) | 
|  | /* UNALIGNED64_OK, 64-bit integer comparison */ | 
|  | static inline uint32_t compare256_unaligned_64_static(const uint8_t *src0, const uint8_t *src1) { | 
|  | uint32_t len = 0; | 
|  |  | 
|  | do { | 
|  | uint64_t sv, mv, diff; | 
|  |  | 
|  | zmemcpy_8(&sv, src0); | 
|  | zmemcpy_8(&mv, src1); | 
|  |  | 
|  | diff = sv ^ mv; | 
|  | if (diff) { | 
|  | uint64_t match_byte = __builtin_ctzll(diff) / 8; | 
|  | return len + (uint32_t)match_byte; | 
|  | } | 
|  |  | 
|  | src0 += 8, src1 += 8, len += 8; | 
|  | } while (len < 256); | 
|  |  | 
|  | return 256; | 
|  | } | 
|  |  | 
|  | Z_INTERNAL uint32_t compare256_unaligned_64(const uint8_t *src0, const uint8_t *src1) { | 
|  | return compare256_unaligned_64_static(src0, src1); | 
|  | } | 
|  |  | 
|  | #define LONGEST_MATCH       longest_match_unaligned_64 | 
|  | #define COMPARE256          compare256_unaligned_64_static | 
|  |  | 
|  | #include "match_tpl.h" | 
|  |  | 
|  | #define LONGEST_MATCH_SLOW | 
|  | #define LONGEST_MATCH       longest_match_slow_unaligned_64 | 
|  | #define COMPARE256          compare256_unaligned_64_static | 
|  |  | 
|  | #include "match_tpl.h" | 
|  |  | 
|  | #endif | 
|  |  | 
|  | #endif |