update xxhash to v0.6.2

This commit is contained in:
Yann Collet 2016-08-10 07:40:40 +02:00
parent 0486bb78c6
commit 8ded0b84aa
2 changed files with 91 additions and 46 deletions

View File

@ -132,7 +132,7 @@ static void* XXH_memcpy(void* dest, const void* src, size_t size) { return memcp
***************************************/ ***************************************/
#ifndef MEM_MODULE #ifndef MEM_MODULE
# define MEM_MODULE # define MEM_MODULE
# if defined (__STDC_VERSION__) && __STDC_VERSION__ >= 199901L /* C99 */ # if !defined (__VMS) && (defined (__cplusplus) || (defined (__STDC_VERSION__) && (__STDC_VERSION__ >= 199901L) /* C99 */) )
# include <stdint.h> # include <stdint.h>
typedef uint8_t BYTE; typedef uint8_t BYTE;
typedef uint16_t U16; typedef uint16_t U16;
@ -144,7 +144,7 @@ static void* XXH_memcpy(void* dest, const void* src, size_t size) { return memcp
typedef unsigned short U16; typedef unsigned short U16;
typedef unsigned int U32; typedef unsigned int U32;
typedef signed int S32; typedef signed int S32;
typedef unsigned long long U64; typedef unsigned long long U64; /* if your compiler doesn't support unsigned long long, replace by another 64-bit type here. Note that xxhash.h will also need to be updated. */
# endif # endif
#endif #endif
@ -307,6 +307,20 @@ static const U64 PRIME64_5 = 2870177450012600261ULL;
XXH_PUBLIC_API unsigned XXH_versionNumber (void) { return XXH_VERSION_NUMBER; } XXH_PUBLIC_API unsigned XXH_versionNumber (void) { return XXH_VERSION_NUMBER; }
/* **************************
* Utils
****************************/
XXH_PUBLIC_API void XXH32_copyState(XXH32_state_t* restrict dstState, const XXH32_state_t* restrict srcState)
{
memcpy(dstState, srcState, sizeof(*dstState));
}
XXH_PUBLIC_API void XXH64_copyState(XXH64_state_t* restrict dstState, const XXH64_state_t* restrict srcState)
{
memcpy(dstState, srcState, sizeof(*dstState));
}
/* *************************** /* ***************************
* Simple Hash Functions * Simple Hash Functions
*****************************/ *****************************/
@ -545,8 +559,7 @@ XXH_PUBLIC_API XXH_errorcode XXH64_freeState(XXH64_state_t* statePtr)
XXH_PUBLIC_API XXH_errorcode XXH32_reset(XXH32_state_t* statePtr, unsigned int seed) XXH_PUBLIC_API XXH_errorcode XXH32_reset(XXH32_state_t* statePtr, unsigned int seed)
{ {
XXH32_state_t state; /* using a local state to memcpy() in order to avoid strict-aliasing warnings */ XXH32_state_t state; /* using a local state to memcpy() in order to avoid strict-aliasing warnings */
memset(&state, 0, sizeof(state)); memset(&state, 0, sizeof(state)-4); /* do not write into reserved, for future removal */
state.seed = seed;
state.v1 = seed + PRIME32_1 + PRIME32_2; state.v1 = seed + PRIME32_1 + PRIME32_2;
state.v2 = seed + PRIME32_2; state.v2 = seed + PRIME32_2;
state.v3 = seed + 0; state.v3 = seed + 0;
@ -559,8 +572,7 @@ XXH_PUBLIC_API XXH_errorcode XXH32_reset(XXH32_state_t* statePtr, unsigned int s
XXH_PUBLIC_API XXH_errorcode XXH64_reset(XXH64_state_t* statePtr, unsigned long long seed) XXH_PUBLIC_API XXH_errorcode XXH64_reset(XXH64_state_t* statePtr, unsigned long long seed)
{ {
XXH64_state_t state; /* using a local state to memcpy() in order to avoid strict-aliasing warnings */ XXH64_state_t state; /* using a local state to memcpy() in order to avoid strict-aliasing warnings */
memset(&state, 0, sizeof(state)); memset(&state, 0, sizeof(state)-8); /* do not write into reserved, for future removal */
state.seed = seed;
state.v1 = seed + PRIME64_1 + PRIME64_2; state.v1 = seed + PRIME64_1 + PRIME64_2;
state.v2 = seed + PRIME64_2; state.v2 = seed + PRIME64_2;
state.v3 = seed + 0; state.v3 = seed + 0;
@ -579,7 +591,8 @@ FORCE_INLINE XXH_errorcode XXH32_update_endian (XXH32_state_t* state, const void
if (input==NULL) return XXH_ERROR; if (input==NULL) return XXH_ERROR;
#endif #endif
state->total_len += len; state->total_len_32 += len;
state->large_len |= (len>=16) | (state->total_len_32>=16);
if (state->memsize + len < 16) { /* fill in tmp buffer */ if (state->memsize + len < 16) { /* fill in tmp buffer */
XXH_memcpy((BYTE*)(state->mem32) + state->memsize, input, len); XXH_memcpy((BYTE*)(state->mem32) + state->memsize, input, len);
@ -645,13 +658,13 @@ FORCE_INLINE U32 XXH32_digest_endian (const XXH32_state_t* state, XXH_endianess
const BYTE* const bEnd = (const BYTE*)(state->mem32) + state->memsize; const BYTE* const bEnd = (const BYTE*)(state->mem32) + state->memsize;
U32 h32; U32 h32;
if (state->total_len >= 16) { if (state->large_len) {
h32 = XXH_rotl32(state->v1, 1) + XXH_rotl32(state->v2, 7) + XXH_rotl32(state->v3, 12) + XXH_rotl32(state->v4, 18); h32 = XXH_rotl32(state->v1, 1) + XXH_rotl32(state->v2, 7) + XXH_rotl32(state->v3, 12) + XXH_rotl32(state->v4, 18);
} else { } else {
h32 = state->seed + PRIME32_5; h32 = state->v3 /* == seed */ + PRIME32_5;
} }
h32 += (U32) state->total_len; h32 += state->total_len_32;
while (p+4<=bEnd) { while (p+4<=bEnd) {
h32 += XXH_readLE32(p, endian) * PRIME32_3; h32 += XXH_readLE32(p, endian) * PRIME32_3;
@ -774,7 +787,7 @@ FORCE_INLINE U64 XXH64_digest_endian (const XXH64_state_t* state, XXH_endianess
h64 = XXH64_mergeRound(h64, v3); h64 = XXH64_mergeRound(h64, v3);
h64 = XXH64_mergeRound(h64, v4); h64 = XXH64_mergeRound(h64, v4);
} else { } else {
h64 = state->seed + PRIME64_5; h64 = state->v3 + PRIME64_5;
} }
h64 += (U64) state->total_len; h64 += (U64) state->total_len;

View File

@ -82,18 +82,21 @@ typedef enum { XXH_OK=0, XXH_ERROR } XXH_errorcode;
/* **************************** /* ****************************
* API modifier * API modifier
******************************/ ******************************/
/*!XXH_PRIVATE_API /** XXH_PRIVATE_API
* Transforms all publics symbols within `xxhash.c` into private ones. * This is useful if you want to include xxhash functions in `static` mode
* Methodology : * in order to inline them, and remove their symbol from the public list.
* instead of : #include "xxhash.h" * Methodology :
* do :
* #define XXH_PRIVATE_API * #define XXH_PRIVATE_API
* #include "xxhash.c" // note the .c , instead of .h * #include "xxhash.h"
* also : don't compile and link xxhash.c separately * `xxhash.c` is automatically included.
* It's not useful to compile and link it as a separate module anymore.
*/ */
#ifdef XXH_PRIVATE_API #ifdef XXH_PRIVATE_API
# ifndef XXH_STATIC_LINKING_ONLY
# define XXH_STATIC_LINKING_ONLY
# endif
# if defined(__GNUC__) # if defined(__GNUC__)
# define XXH_PUBLIC_API static __attribute__((unused)) # define XXH_PUBLIC_API static __inline __attribute__((unused))
# elif defined (__cplusplus) || (defined (__STDC_VERSION__) && (__STDC_VERSION__ >= 199901L) /* C99 */) # elif defined (__cplusplus) || (defined (__STDC_VERSION__) && (__STDC_VERSION__ >= 199901L) /* C99 */)
# define XXH_PUBLIC_API static inline # define XXH_PUBLIC_API static inline
# elif defined(_MSC_VER) # elif defined(_MSC_VER)
@ -103,17 +106,17 @@ typedef enum { XXH_OK=0, XXH_ERROR } XXH_errorcode;
# endif # endif
#else #else
# define XXH_PUBLIC_API /* do nothing */ # define XXH_PUBLIC_API /* do nothing */
#endif #endif /* XXH_PRIVATE_API */
/*!XXH_NAMESPACE, aka Namespace Emulation : /*!XXH_NAMESPACE, aka Namespace Emulation :
If you want to include _and expose_ xxHash functions from within your own library, If you want to include _and expose_ xxHash functions from within your own library,
but also want to avoid symbol collisions with another library which also includes xxHash, but also want to avoid symbol collisions with another library which also includes xxHash,
you can use XXH_NAMESPACE, to automatically prefix any public symbol from `xxhash.c` you can use XXH_NAMESPACE, to automatically prefix any public symbol from xxhash library
with the value of XXH_NAMESPACE (so avoid to keep it NULL and avoid numeric values). with the value of XXH_NAMESPACE (so avoid to keep it NULL and avoid numeric values).
Note that no change is required within the calling program as long as it also includes `xxhash.h` : Note that no change is required within the calling program as long as it includes `xxhash.h` :
regular symbol name will be automatically translated by this header. regular symbol name will be automatically translated by this header.
*/ */
#ifdef XXH_NAMESPACE #ifdef XXH_NAMESPACE
@ -132,6 +135,12 @@ regular symbol name will be automatically translated by this header.
# define XXH64_update XXH_NAME2(XXH_NAMESPACE, XXH64_update) # define XXH64_update XXH_NAME2(XXH_NAMESPACE, XXH64_update)
# define XXH32_digest XXH_NAME2(XXH_NAMESPACE, XXH32_digest) # define XXH32_digest XXH_NAME2(XXH_NAMESPACE, XXH32_digest)
# define XXH64_digest XXH_NAME2(XXH_NAMESPACE, XXH64_digest) # define XXH64_digest XXH_NAME2(XXH_NAMESPACE, XXH64_digest)
# define XXH32_copyState XXH_NAME2(XXH_NAMESPACE, XXH32_copyState)
# define XXH64_copyState XXH_NAME2(XXH_NAMESPACE, XXH64_copyState)
# define XXH32_canonicalFromHash XXH_NAME2(XXH_NAMESPACE, XXH32_canonicalFromHash)
# define XXH64_canonicalFromHash XXH_NAME2(XXH_NAMESPACE, XXH64_canonicalFromHash)
# define XXH32_hashFromCanonical XXH_NAME2(XXH_NAMESPACE, XXH32_hashFromCanonical)
# define XXH64_hashFromCanonical XXH_NAME2(XXH_NAMESPACE, XXH64_hashFromCanonical)
#endif #endif
@ -140,7 +149,7 @@ regular symbol name will be automatically translated by this header.
***************************************/ ***************************************/
#define XXH_VERSION_MAJOR 0 #define XXH_VERSION_MAJOR 0
#define XXH_VERSION_MINOR 6 #define XXH_VERSION_MINOR 6
#define XXH_VERSION_RELEASE 0 #define XXH_VERSION_RELEASE 2
#define XXH_VERSION_NUMBER (XXH_VERSION_MAJOR *100*100 + XXH_VERSION_MINOR *100 + XXH_VERSION_RELEASE) #define XXH_VERSION_NUMBER (XXH_VERSION_MAJOR *100*100 + XXH_VERSION_MINOR *100 + XXH_VERSION_RELEASE)
XXH_PUBLIC_API unsigned XXH_versionNumber (void); XXH_PUBLIC_API unsigned XXH_versionNumber (void);
@ -163,7 +172,7 @@ XXH32() :
XXH64() : XXH64() :
Calculate the 64-bits hash of sequence of length "len" stored at memory address "input". Calculate the 64-bits hash of sequence of length "len" stored at memory address "input".
"seed" can be used to alter the result predictably. "seed" can be used to alter the result predictably.
This function runs faster on 64-bits systems, but slower on 32-bits systems (see benchmark). This function runs 2x faster on 64-bits systems, but slower on 32-bits systems (see benchmark).
*/ */
@ -173,8 +182,7 @@ XXH64() :
typedef struct XXH32_state_s XXH32_state_t; /* incomplete type */ typedef struct XXH32_state_s XXH32_state_t; /* incomplete type */
typedef struct XXH64_state_s XXH64_state_t; /* incomplete type */ typedef struct XXH64_state_s XXH64_state_t; /* incomplete type */
/*! Dynamic allocation of states /*! State allocation, compatible with dynamic libraries */
Compatible with dynamic libraries */
XXH_PUBLIC_API XXH32_state_t* XXH32_createState(void); XXH_PUBLIC_API XXH32_state_t* XXH32_createState(void);
XXH_PUBLIC_API XXH_errorcode XXH32_freeState(XXH32_state_t* statePtr); XXH_PUBLIC_API XXH_errorcode XXH32_freeState(XXH32_state_t* statePtr);
@ -193,28 +201,40 @@ XXH_PUBLIC_API XXH_errorcode XXH64_reset (XXH64_state_t* statePtr, unsigned lon
XXH_PUBLIC_API XXH_errorcode XXH64_update (XXH64_state_t* statePtr, const void* input, size_t length); XXH_PUBLIC_API XXH_errorcode XXH64_update (XXH64_state_t* statePtr, const void* input, size_t length);
XXH_PUBLIC_API XXH64_hash_t XXH64_digest (const XXH64_state_t* statePtr); XXH_PUBLIC_API XXH64_hash_t XXH64_digest (const XXH64_state_t* statePtr);
/*! /*
These functions generate the xxHash of an input provided in multiple segments, These functions generate the xxHash of an input provided in multiple segments.
as opposed to provided as a single block. Note that, for small input, they are slower than single-call functions, due to state management.
For small input, prefer `XXH32()` and `XXH64()` .
XXH state must first be allocated, using either static or dynamic method provided above. XXH state must first be allocated, using XXH*_createState() .
Start a new hash by initializing state with a seed, using XXHnn_reset(). Start a new hash by initializing state with a seed, using XXH*_reset().
Then, feed the hash state by calling XXHnn_update() as many times as necessary. Then, feed the hash state by calling XXH*_update() as many times as necessary.
Obviously, input must be valid, hence allocated and read accessible. Obviously, input must be allocated and read accessible.
The function returns an error code, with 0 meaning OK, and any other value meaning there is an error. The function returns an error code, with 0 meaning OK, and any other value meaning there is an error.
Finally, a hash value can be produced anytime, by using XXHnn_digest(). Finally, a hash value can be produced anytime, by using XXH*_digest().
This function returns the nn-bits hash as an int or long long. This function returns the nn-bits hash as an int or long long.
It's still possible to continue inserting input into the hash state after a digest, It's still possible to continue inserting input into the hash state after a digest,
and later on generate some new hashes, by calling again XXHnn_digest(). and generate some new hashes later on, by calling again XXH*_digest().
When done, free XXH state space if it was allocated dynamically. When done, free XXH state space if it was allocated dynamically.
*/ */
/* **************************
* Utils
****************************/
#if !(defined(__STDC_VERSION__) && (__STDC_VERSION__ >= 199901L)) /* ! C99 */
# define restrict /* disable restrict */
#endif
XXH_PUBLIC_API void XXH32_copyState(XXH32_state_t* restrict dst_state, const XXH32_state_t* restrict src_state);
XXH_PUBLIC_API void XXH64_copyState(XXH64_state_t* restrict dst_state, const XXH64_state_t* restrict src_state);
/* ************************** /* **************************
* Canonical representation * Canonical representation
****************************/ ****************************/
@ -227,43 +247,55 @@ XXH_PUBLIC_API void XXH64_canonicalFromHash(XXH64_canonical_t* dst, XXH64_hash_t
XXH_PUBLIC_API XXH32_hash_t XXH32_hashFromCanonical(const XXH32_canonical_t* src); XXH_PUBLIC_API XXH32_hash_t XXH32_hashFromCanonical(const XXH32_canonical_t* src);
XXH_PUBLIC_API XXH64_hash_t XXH64_hashFromCanonical(const XXH64_canonical_t* src); XXH_PUBLIC_API XXH64_hash_t XXH64_hashFromCanonical(const XXH64_canonical_t* src);
/*! Default result type for XXH functions are primitive unsigned 32 and 64 bits. /* Default result type for XXH functions are primitive unsigned 32 and 64 bits.
* The canonical representation uses human-readable write convention, aka big-endian (large digits first). * The canonical representation uses human-readable write convention, aka big-endian (large digits first).
* These functions allow transformation of hash result into and from its canonical format. * These functions allow transformation of hash result into and from its canonical format.
* This way, hash values can be written into a file / memory, and remain comparable on different systems and programs. * This way, hash values can be written into a file / memory, and remain comparable on different systems and programs.
*/ */
#ifdef XXH_STATIC_LINKING_ONLY #ifdef XXH_STATIC_LINKING_ONLY
/* This part contains definition which shall only be used with static linking. /* ================================================================================================
The prototypes / types defined here are not guaranteed to remain stable. This section contains definitions which are not guaranteed to remain stable.
They could change in a future version, becoming incompatible with a different version of the library */ They may change in future versions, becoming incompatible with a different version of the library.
They shall only be used with static linking.
Never use these definitions in association with dynamic linking !
=================================================================================================== */
/* These definitions are only meant to allow allocation of XXH state
statically, on stack, or in a struct for example.
Do not use members directly. */
struct XXH32_state_s { struct XXH32_state_s {
unsigned long long total_len; unsigned total_len_32;
unsigned seed; unsigned large_len;
unsigned v1; unsigned v1;
unsigned v2; unsigned v2;
unsigned v3; unsigned v3;
unsigned v4; unsigned v4;
unsigned mem32[4]; /* buffer defined as U32 for alignment */ unsigned mem32[4]; /* buffer defined as U32 for alignment */
unsigned memsize; unsigned memsize;
unsigned reserved; /* never read nor write, will be removed in a future version */
}; /* typedef'd to XXH32_state_t */ }; /* typedef'd to XXH32_state_t */
struct XXH64_state_s { struct XXH64_state_s {
unsigned long long total_len; unsigned long long total_len;
unsigned long long seed;
unsigned long long v1; unsigned long long v1;
unsigned long long v2; unsigned long long v2;
unsigned long long v3; unsigned long long v3;
unsigned long long v4; unsigned long long v4;
unsigned long long mem64[4]; /* buffer defined as U64 for alignment */ unsigned long long mem64[4]; /* buffer defined as U64 for alignment */
unsigned memsize; unsigned memsize;
unsigned reserved[2]; /* never read nor write, will be removed in a future version */
}; /* typedef'd to XXH64_state_t */ }; /* typedef'd to XXH64_state_t */
#endif # ifdef XXH_PRIVATE_API
# include "xxhash.c" /* include xxhash functions as `static`, for inlining */
# endif
#endif /* XXH_STATIC_LINKING_ONLY */
#if defined (__cplusplus) #if defined (__cplusplus)