mirror of
https://github.com/facebook/zstd.git
synced 2025-10-07 00:12:40 -04:00
update xxhash to v0.6.2
This commit is contained in:
parent
0486bb78c6
commit
8ded0b84aa
@ -132,7 +132,7 @@ static void* XXH_memcpy(void* dest, const void* src, size_t size) { return memcp
|
|||||||
***************************************/
|
***************************************/
|
||||||
#ifndef MEM_MODULE
|
#ifndef MEM_MODULE
|
||||||
# define MEM_MODULE
|
# define MEM_MODULE
|
||||||
# if defined (__STDC_VERSION__) && __STDC_VERSION__ >= 199901L /* C99 */
|
# if !defined (__VMS) && (defined (__cplusplus) || (defined (__STDC_VERSION__) && (__STDC_VERSION__ >= 199901L) /* C99 */) )
|
||||||
# include <stdint.h>
|
# include <stdint.h>
|
||||||
typedef uint8_t BYTE;
|
typedef uint8_t BYTE;
|
||||||
typedef uint16_t U16;
|
typedef uint16_t U16;
|
||||||
@ -144,7 +144,7 @@ static void* XXH_memcpy(void* dest, const void* src, size_t size) { return memcp
|
|||||||
typedef unsigned short U16;
|
typedef unsigned short U16;
|
||||||
typedef unsigned int U32;
|
typedef unsigned int U32;
|
||||||
typedef signed int S32;
|
typedef signed int S32;
|
||||||
typedef unsigned long long U64;
|
typedef unsigned long long U64; /* if your compiler doesn't support unsigned long long, replace by another 64-bit type here. Note that xxhash.h will also need to be updated. */
|
||||||
# endif
|
# endif
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
@ -307,6 +307,20 @@ static const U64 PRIME64_5 = 2870177450012600261ULL;
|
|||||||
XXH_PUBLIC_API unsigned XXH_versionNumber (void) { return XXH_VERSION_NUMBER; }
|
XXH_PUBLIC_API unsigned XXH_versionNumber (void) { return XXH_VERSION_NUMBER; }
|
||||||
|
|
||||||
|
|
||||||
|
/* **************************
|
||||||
|
* Utils
|
||||||
|
****************************/
|
||||||
|
XXH_PUBLIC_API void XXH32_copyState(XXH32_state_t* restrict dstState, const XXH32_state_t* restrict srcState)
|
||||||
|
{
|
||||||
|
memcpy(dstState, srcState, sizeof(*dstState));
|
||||||
|
}
|
||||||
|
|
||||||
|
XXH_PUBLIC_API void XXH64_copyState(XXH64_state_t* restrict dstState, const XXH64_state_t* restrict srcState)
|
||||||
|
{
|
||||||
|
memcpy(dstState, srcState, sizeof(*dstState));
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
/* ***************************
|
/* ***************************
|
||||||
* Simple Hash Functions
|
* Simple Hash Functions
|
||||||
*****************************/
|
*****************************/
|
||||||
@ -545,8 +559,7 @@ XXH_PUBLIC_API XXH_errorcode XXH64_freeState(XXH64_state_t* statePtr)
|
|||||||
XXH_PUBLIC_API XXH_errorcode XXH32_reset(XXH32_state_t* statePtr, unsigned int seed)
|
XXH_PUBLIC_API XXH_errorcode XXH32_reset(XXH32_state_t* statePtr, unsigned int seed)
|
||||||
{
|
{
|
||||||
XXH32_state_t state; /* using a local state to memcpy() in order to avoid strict-aliasing warnings */
|
XXH32_state_t state; /* using a local state to memcpy() in order to avoid strict-aliasing warnings */
|
||||||
memset(&state, 0, sizeof(state));
|
memset(&state, 0, sizeof(state)-4); /* do not write into reserved, for future removal */
|
||||||
state.seed = seed;
|
|
||||||
state.v1 = seed + PRIME32_1 + PRIME32_2;
|
state.v1 = seed + PRIME32_1 + PRIME32_2;
|
||||||
state.v2 = seed + PRIME32_2;
|
state.v2 = seed + PRIME32_2;
|
||||||
state.v3 = seed + 0;
|
state.v3 = seed + 0;
|
||||||
@ -559,8 +572,7 @@ XXH_PUBLIC_API XXH_errorcode XXH32_reset(XXH32_state_t* statePtr, unsigned int s
|
|||||||
XXH_PUBLIC_API XXH_errorcode XXH64_reset(XXH64_state_t* statePtr, unsigned long long seed)
|
XXH_PUBLIC_API XXH_errorcode XXH64_reset(XXH64_state_t* statePtr, unsigned long long seed)
|
||||||
{
|
{
|
||||||
XXH64_state_t state; /* using a local state to memcpy() in order to avoid strict-aliasing warnings */
|
XXH64_state_t state; /* using a local state to memcpy() in order to avoid strict-aliasing warnings */
|
||||||
memset(&state, 0, sizeof(state));
|
memset(&state, 0, sizeof(state)-8); /* do not write into reserved, for future removal */
|
||||||
state.seed = seed;
|
|
||||||
state.v1 = seed + PRIME64_1 + PRIME64_2;
|
state.v1 = seed + PRIME64_1 + PRIME64_2;
|
||||||
state.v2 = seed + PRIME64_2;
|
state.v2 = seed + PRIME64_2;
|
||||||
state.v3 = seed + 0;
|
state.v3 = seed + 0;
|
||||||
@ -579,7 +591,8 @@ FORCE_INLINE XXH_errorcode XXH32_update_endian (XXH32_state_t* state, const void
|
|||||||
if (input==NULL) return XXH_ERROR;
|
if (input==NULL) return XXH_ERROR;
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
state->total_len += len;
|
state->total_len_32 += len;
|
||||||
|
state->large_len |= (len>=16) | (state->total_len_32>=16);
|
||||||
|
|
||||||
if (state->memsize + len < 16) { /* fill in tmp buffer */
|
if (state->memsize + len < 16) { /* fill in tmp buffer */
|
||||||
XXH_memcpy((BYTE*)(state->mem32) + state->memsize, input, len);
|
XXH_memcpy((BYTE*)(state->mem32) + state->memsize, input, len);
|
||||||
@ -645,13 +658,13 @@ FORCE_INLINE U32 XXH32_digest_endian (const XXH32_state_t* state, XXH_endianess
|
|||||||
const BYTE* const bEnd = (const BYTE*)(state->mem32) + state->memsize;
|
const BYTE* const bEnd = (const BYTE*)(state->mem32) + state->memsize;
|
||||||
U32 h32;
|
U32 h32;
|
||||||
|
|
||||||
if (state->total_len >= 16) {
|
if (state->large_len) {
|
||||||
h32 = XXH_rotl32(state->v1, 1) + XXH_rotl32(state->v2, 7) + XXH_rotl32(state->v3, 12) + XXH_rotl32(state->v4, 18);
|
h32 = XXH_rotl32(state->v1, 1) + XXH_rotl32(state->v2, 7) + XXH_rotl32(state->v3, 12) + XXH_rotl32(state->v4, 18);
|
||||||
} else {
|
} else {
|
||||||
h32 = state->seed + PRIME32_5;
|
h32 = state->v3 /* == seed */ + PRIME32_5;
|
||||||
}
|
}
|
||||||
|
|
||||||
h32 += (U32) state->total_len;
|
h32 += state->total_len_32;
|
||||||
|
|
||||||
while (p+4<=bEnd) {
|
while (p+4<=bEnd) {
|
||||||
h32 += XXH_readLE32(p, endian) * PRIME32_3;
|
h32 += XXH_readLE32(p, endian) * PRIME32_3;
|
||||||
@ -774,7 +787,7 @@ FORCE_INLINE U64 XXH64_digest_endian (const XXH64_state_t* state, XXH_endianess
|
|||||||
h64 = XXH64_mergeRound(h64, v3);
|
h64 = XXH64_mergeRound(h64, v3);
|
||||||
h64 = XXH64_mergeRound(h64, v4);
|
h64 = XXH64_mergeRound(h64, v4);
|
||||||
} else {
|
} else {
|
||||||
h64 = state->seed + PRIME64_5;
|
h64 = state->v3 + PRIME64_5;
|
||||||
}
|
}
|
||||||
|
|
||||||
h64 += (U64) state->total_len;
|
h64 += (U64) state->total_len;
|
||||||
|
@ -82,18 +82,21 @@ typedef enum { XXH_OK=0, XXH_ERROR } XXH_errorcode;
|
|||||||
/* ****************************
|
/* ****************************
|
||||||
* API modifier
|
* API modifier
|
||||||
******************************/
|
******************************/
|
||||||
/*!XXH_PRIVATE_API
|
/** XXH_PRIVATE_API
|
||||||
* Transforms all publics symbols within `xxhash.c` into private ones.
|
* This is useful if you want to include xxhash functions in `static` mode
|
||||||
* Methodology :
|
* in order to inline them, and remove their symbol from the public list.
|
||||||
* instead of : #include "xxhash.h"
|
* Methodology :
|
||||||
* do :
|
|
||||||
* #define XXH_PRIVATE_API
|
* #define XXH_PRIVATE_API
|
||||||
* #include "xxhash.c" // note the .c , instead of .h
|
* #include "xxhash.h"
|
||||||
* also : don't compile and link xxhash.c separately
|
* `xxhash.c` is automatically included.
|
||||||
|
* It's not useful to compile and link it as a separate module anymore.
|
||||||
*/
|
*/
|
||||||
#ifdef XXH_PRIVATE_API
|
#ifdef XXH_PRIVATE_API
|
||||||
|
# ifndef XXH_STATIC_LINKING_ONLY
|
||||||
|
# define XXH_STATIC_LINKING_ONLY
|
||||||
|
# endif
|
||||||
# if defined(__GNUC__)
|
# if defined(__GNUC__)
|
||||||
# define XXH_PUBLIC_API static __attribute__((unused))
|
# define XXH_PUBLIC_API static __inline __attribute__((unused))
|
||||||
# elif defined (__cplusplus) || (defined (__STDC_VERSION__) && (__STDC_VERSION__ >= 199901L) /* C99 */)
|
# elif defined (__cplusplus) || (defined (__STDC_VERSION__) && (__STDC_VERSION__ >= 199901L) /* C99 */)
|
||||||
# define XXH_PUBLIC_API static inline
|
# define XXH_PUBLIC_API static inline
|
||||||
# elif defined(_MSC_VER)
|
# elif defined(_MSC_VER)
|
||||||
@ -103,17 +106,17 @@ typedef enum { XXH_OK=0, XXH_ERROR } XXH_errorcode;
|
|||||||
# endif
|
# endif
|
||||||
#else
|
#else
|
||||||
# define XXH_PUBLIC_API /* do nothing */
|
# define XXH_PUBLIC_API /* do nothing */
|
||||||
#endif
|
#endif /* XXH_PRIVATE_API */
|
||||||
|
|
||||||
/*!XXH_NAMESPACE, aka Namespace Emulation :
|
/*!XXH_NAMESPACE, aka Namespace Emulation :
|
||||||
|
|
||||||
If you want to include _and expose_ xxHash functions from within your own library,
|
If you want to include _and expose_ xxHash functions from within your own library,
|
||||||
but also want to avoid symbol collisions with another library which also includes xxHash,
|
but also want to avoid symbol collisions with another library which also includes xxHash,
|
||||||
|
|
||||||
you can use XXH_NAMESPACE, to automatically prefix any public symbol from `xxhash.c`
|
you can use XXH_NAMESPACE, to automatically prefix any public symbol from xxhash library
|
||||||
with the value of XXH_NAMESPACE (so avoid to keep it NULL and avoid numeric values).
|
with the value of XXH_NAMESPACE (so avoid to keep it NULL and avoid numeric values).
|
||||||
|
|
||||||
Note that no change is required within the calling program as long as it also includes `xxhash.h` :
|
Note that no change is required within the calling program as long as it includes `xxhash.h` :
|
||||||
regular symbol name will be automatically translated by this header.
|
regular symbol name will be automatically translated by this header.
|
||||||
*/
|
*/
|
||||||
#ifdef XXH_NAMESPACE
|
#ifdef XXH_NAMESPACE
|
||||||
@ -132,6 +135,12 @@ regular symbol name will be automatically translated by this header.
|
|||||||
# define XXH64_update XXH_NAME2(XXH_NAMESPACE, XXH64_update)
|
# define XXH64_update XXH_NAME2(XXH_NAMESPACE, XXH64_update)
|
||||||
# define XXH32_digest XXH_NAME2(XXH_NAMESPACE, XXH32_digest)
|
# define XXH32_digest XXH_NAME2(XXH_NAMESPACE, XXH32_digest)
|
||||||
# define XXH64_digest XXH_NAME2(XXH_NAMESPACE, XXH64_digest)
|
# define XXH64_digest XXH_NAME2(XXH_NAMESPACE, XXH64_digest)
|
||||||
|
# define XXH32_copyState XXH_NAME2(XXH_NAMESPACE, XXH32_copyState)
|
||||||
|
# define XXH64_copyState XXH_NAME2(XXH_NAMESPACE, XXH64_copyState)
|
||||||
|
# define XXH32_canonicalFromHash XXH_NAME2(XXH_NAMESPACE, XXH32_canonicalFromHash)
|
||||||
|
# define XXH64_canonicalFromHash XXH_NAME2(XXH_NAMESPACE, XXH64_canonicalFromHash)
|
||||||
|
# define XXH32_hashFromCanonical XXH_NAME2(XXH_NAMESPACE, XXH32_hashFromCanonical)
|
||||||
|
# define XXH64_hashFromCanonical XXH_NAME2(XXH_NAMESPACE, XXH64_hashFromCanonical)
|
||||||
#endif
|
#endif
|
||||||
|
|
||||||
|
|
||||||
@ -140,7 +149,7 @@ regular symbol name will be automatically translated by this header.
|
|||||||
***************************************/
|
***************************************/
|
||||||
#define XXH_VERSION_MAJOR 0
|
#define XXH_VERSION_MAJOR 0
|
||||||
#define XXH_VERSION_MINOR 6
|
#define XXH_VERSION_MINOR 6
|
||||||
#define XXH_VERSION_RELEASE 0
|
#define XXH_VERSION_RELEASE 2
|
||||||
#define XXH_VERSION_NUMBER (XXH_VERSION_MAJOR *100*100 + XXH_VERSION_MINOR *100 + XXH_VERSION_RELEASE)
|
#define XXH_VERSION_NUMBER (XXH_VERSION_MAJOR *100*100 + XXH_VERSION_MINOR *100 + XXH_VERSION_RELEASE)
|
||||||
XXH_PUBLIC_API unsigned XXH_versionNumber (void);
|
XXH_PUBLIC_API unsigned XXH_versionNumber (void);
|
||||||
|
|
||||||
@ -163,7 +172,7 @@ XXH32() :
|
|||||||
XXH64() :
|
XXH64() :
|
||||||
Calculate the 64-bits hash of sequence of length "len" stored at memory address "input".
|
Calculate the 64-bits hash of sequence of length "len" stored at memory address "input".
|
||||||
"seed" can be used to alter the result predictably.
|
"seed" can be used to alter the result predictably.
|
||||||
This function runs faster on 64-bits systems, but slower on 32-bits systems (see benchmark).
|
This function runs 2x faster on 64-bits systems, but slower on 32-bits systems (see benchmark).
|
||||||
*/
|
*/
|
||||||
|
|
||||||
|
|
||||||
@ -173,8 +182,7 @@ XXH64() :
|
|||||||
typedef struct XXH32_state_s XXH32_state_t; /* incomplete type */
|
typedef struct XXH32_state_s XXH32_state_t; /* incomplete type */
|
||||||
typedef struct XXH64_state_s XXH64_state_t; /* incomplete type */
|
typedef struct XXH64_state_s XXH64_state_t; /* incomplete type */
|
||||||
|
|
||||||
/*! Dynamic allocation of states
|
/*! State allocation, compatible with dynamic libraries */
|
||||||
Compatible with dynamic libraries */
|
|
||||||
|
|
||||||
XXH_PUBLIC_API XXH32_state_t* XXH32_createState(void);
|
XXH_PUBLIC_API XXH32_state_t* XXH32_createState(void);
|
||||||
XXH_PUBLIC_API XXH_errorcode XXH32_freeState(XXH32_state_t* statePtr);
|
XXH_PUBLIC_API XXH_errorcode XXH32_freeState(XXH32_state_t* statePtr);
|
||||||
@ -193,28 +201,40 @@ XXH_PUBLIC_API XXH_errorcode XXH64_reset (XXH64_state_t* statePtr, unsigned lon
|
|||||||
XXH_PUBLIC_API XXH_errorcode XXH64_update (XXH64_state_t* statePtr, const void* input, size_t length);
|
XXH_PUBLIC_API XXH_errorcode XXH64_update (XXH64_state_t* statePtr, const void* input, size_t length);
|
||||||
XXH_PUBLIC_API XXH64_hash_t XXH64_digest (const XXH64_state_t* statePtr);
|
XXH_PUBLIC_API XXH64_hash_t XXH64_digest (const XXH64_state_t* statePtr);
|
||||||
|
|
||||||
/*!
|
/*
|
||||||
These functions generate the xxHash of an input provided in multiple segments,
|
These functions generate the xxHash of an input provided in multiple segments.
|
||||||
as opposed to provided as a single block.
|
Note that, for small input, they are slower than single-call functions, due to state management.
|
||||||
|
For small input, prefer `XXH32()` and `XXH64()` .
|
||||||
|
|
||||||
XXH state must first be allocated, using either static or dynamic method provided above.
|
XXH state must first be allocated, using XXH*_createState() .
|
||||||
|
|
||||||
Start a new hash by initializing state with a seed, using XXHnn_reset().
|
Start a new hash by initializing state with a seed, using XXH*_reset().
|
||||||
|
|
||||||
Then, feed the hash state by calling XXHnn_update() as many times as necessary.
|
Then, feed the hash state by calling XXH*_update() as many times as necessary.
|
||||||
Obviously, input must be valid, hence allocated and read accessible.
|
Obviously, input must be allocated and read accessible.
|
||||||
The function returns an error code, with 0 meaning OK, and any other value meaning there is an error.
|
The function returns an error code, with 0 meaning OK, and any other value meaning there is an error.
|
||||||
|
|
||||||
Finally, a hash value can be produced anytime, by using XXHnn_digest().
|
Finally, a hash value can be produced anytime, by using XXH*_digest().
|
||||||
This function returns the nn-bits hash as an int or long long.
|
This function returns the nn-bits hash as an int or long long.
|
||||||
|
|
||||||
It's still possible to continue inserting input into the hash state after a digest,
|
It's still possible to continue inserting input into the hash state after a digest,
|
||||||
and later on generate some new hashes, by calling again XXHnn_digest().
|
and generate some new hashes later on, by calling again XXH*_digest().
|
||||||
|
|
||||||
When done, free XXH state space if it was allocated dynamically.
|
When done, free XXH state space if it was allocated dynamically.
|
||||||
*/
|
*/
|
||||||
|
|
||||||
|
|
||||||
|
/* **************************
|
||||||
|
* Utils
|
||||||
|
****************************/
|
||||||
|
#if !(defined(__STDC_VERSION__) && (__STDC_VERSION__ >= 199901L)) /* ! C99 */
|
||||||
|
# define restrict /* disable restrict */
|
||||||
|
#endif
|
||||||
|
|
||||||
|
XXH_PUBLIC_API void XXH32_copyState(XXH32_state_t* restrict dst_state, const XXH32_state_t* restrict src_state);
|
||||||
|
XXH_PUBLIC_API void XXH64_copyState(XXH64_state_t* restrict dst_state, const XXH64_state_t* restrict src_state);
|
||||||
|
|
||||||
|
|
||||||
/* **************************
|
/* **************************
|
||||||
* Canonical representation
|
* Canonical representation
|
||||||
****************************/
|
****************************/
|
||||||
@ -227,43 +247,55 @@ XXH_PUBLIC_API void XXH64_canonicalFromHash(XXH64_canonical_t* dst, XXH64_hash_t
|
|||||||
XXH_PUBLIC_API XXH32_hash_t XXH32_hashFromCanonical(const XXH32_canonical_t* src);
|
XXH_PUBLIC_API XXH32_hash_t XXH32_hashFromCanonical(const XXH32_canonical_t* src);
|
||||||
XXH_PUBLIC_API XXH64_hash_t XXH64_hashFromCanonical(const XXH64_canonical_t* src);
|
XXH_PUBLIC_API XXH64_hash_t XXH64_hashFromCanonical(const XXH64_canonical_t* src);
|
||||||
|
|
||||||
/*! Default result type for XXH functions are primitive unsigned 32 and 64 bits.
|
/* Default result type for XXH functions are primitive unsigned 32 and 64 bits.
|
||||||
* The canonical representation uses human-readable write convention, aka big-endian (large digits first).
|
* The canonical representation uses human-readable write convention, aka big-endian (large digits first).
|
||||||
* These functions allow transformation of hash result into and from its canonical format.
|
* These functions allow transformation of hash result into and from its canonical format.
|
||||||
* This way, hash values can be written into a file / memory, and remain comparable on different systems and programs.
|
* This way, hash values can be written into a file / memory, and remain comparable on different systems and programs.
|
||||||
*/
|
*/
|
||||||
|
|
||||||
|
|
||||||
#ifdef XXH_STATIC_LINKING_ONLY
|
#ifdef XXH_STATIC_LINKING_ONLY
|
||||||
|
|
||||||
/* This part contains definition which shall only be used with static linking.
|
/* ================================================================================================
|
||||||
The prototypes / types defined here are not guaranteed to remain stable.
|
This section contains definitions which are not guaranteed to remain stable.
|
||||||
They could change in a future version, becoming incompatible with a different version of the library */
|
They may change in future versions, becoming incompatible with a different version of the library.
|
||||||
|
They shall only be used with static linking.
|
||||||
|
Never use these definitions in association with dynamic linking !
|
||||||
|
=================================================================================================== */
|
||||||
|
|
||||||
|
/* These definitions are only meant to allow allocation of XXH state
|
||||||
|
statically, on stack, or in a struct for example.
|
||||||
|
Do not use members directly. */
|
||||||
|
|
||||||
struct XXH32_state_s {
|
struct XXH32_state_s {
|
||||||
unsigned long long total_len;
|
unsigned total_len_32;
|
||||||
unsigned seed;
|
unsigned large_len;
|
||||||
unsigned v1;
|
unsigned v1;
|
||||||
unsigned v2;
|
unsigned v2;
|
||||||
unsigned v3;
|
unsigned v3;
|
||||||
unsigned v4;
|
unsigned v4;
|
||||||
unsigned mem32[4]; /* buffer defined as U32 for alignment */
|
unsigned mem32[4]; /* buffer defined as U32 for alignment */
|
||||||
unsigned memsize;
|
unsigned memsize;
|
||||||
|
unsigned reserved; /* never read nor write, will be removed in a future version */
|
||||||
}; /* typedef'd to XXH32_state_t */
|
}; /* typedef'd to XXH32_state_t */
|
||||||
|
|
||||||
struct XXH64_state_s {
|
struct XXH64_state_s {
|
||||||
unsigned long long total_len;
|
unsigned long long total_len;
|
||||||
unsigned long long seed;
|
|
||||||
unsigned long long v1;
|
unsigned long long v1;
|
||||||
unsigned long long v2;
|
unsigned long long v2;
|
||||||
unsigned long long v3;
|
unsigned long long v3;
|
||||||
unsigned long long v4;
|
unsigned long long v4;
|
||||||
unsigned long long mem64[4]; /* buffer defined as U64 for alignment */
|
unsigned long long mem64[4]; /* buffer defined as U64 for alignment */
|
||||||
unsigned memsize;
|
unsigned memsize;
|
||||||
|
unsigned reserved[2]; /* never read nor write, will be removed in a future version */
|
||||||
}; /* typedef'd to XXH64_state_t */
|
}; /* typedef'd to XXH64_state_t */
|
||||||
|
|
||||||
|
|
||||||
#endif
|
# ifdef XXH_PRIVATE_API
|
||||||
|
# include "xxhash.c" /* include xxhash functions as `static`, for inlining */
|
||||||
|
# endif
|
||||||
|
|
||||||
|
#endif /* XXH_STATIC_LINKING_ONLY */
|
||||||
|
|
||||||
|
|
||||||
#if defined (__cplusplus)
|
#if defined (__cplusplus)
|
||||||
|
Loading…
x
Reference in New Issue
Block a user