mirror of
https://github.com/facebook/zstd.git
synced 2025-10-05 00:07:15 -04:00
* First building commit with sample matchfinder * Set up ZSTD_externalMatchCtx struct * move seqBuffer to ZSTD_Sequence* * support non-contiguous dictionary * clean up parens * add clearExternalMatchfinder, handle allocation errors * Add useExternalMatchfinder cParam * validate useExternalMatchfinder cParam * Disable LDM + external matchfinder * Check for static CCtx * Validate mState and mStateDestructor * Improve LDM check to cover both branches * Error API with optional fallback * handle RLE properly for external matchfinder * nit * Move to a CDict-like model for resource ownership * Add hidden useExternalMatchfinder bool to CCtx_params_s * Eliminate malloc, move to cwksp allocation * Handle CCtx reset properly * Ensure seqStore has enough space for external sequences * fix capitalization * Add DEBUGLOG statements * Add compressionLevel param to matchfinder API * fix c99 issues and add a param combination error code * nits * Test external matchfinder API * C90 compat for simpleExternalMatchFinder * Fix some @nocommits and an ASAN bug * nit * nit * nits * forward declare copySequencesToSeqStore functions in zstd_compress_internal.h * nit * nit * nits * Update copyright headers * Fix CMake zstreamtest build * Fix copyright headers (again) * typo * Add externalMatchfinder demo program to make contrib * Reduce memory consumption for small blockSize * ZSTD_postProcessExternalMatchFinderResult nits * test sum(matchlen) + sum(litlen) == srcSize in debug builds * refExternalMatchFinder -> registerExternalMatchFinder * C90 nit * zstreamtest nits * contrib nits * contrib nits * allow block splitter + external matchfinder, refactor * add windowSize param * add contrib/externalMatchfinder/README.md * docs * go back to old RLE heuristic because of the first block issue * fix initializer element is not a constant expression * ref contrib from zstd.h * extremely pedantic compiler warning fix, meson fix, typo fix * Additional docs on API limitations * minor nits * Refactor maxNbSeq calculation into a helper function * Fix copyright
81 lines
2.3 KiB
C
81 lines
2.3 KiB
C
/*
|
|
* Copyright (c) Yann Collet, Meta Platforms, Inc.
|
|
* All rights reserved.
|
|
*
|
|
* This source code is licensed under both the BSD-style license (found in the
|
|
* LICENSE file in the root directory of this source tree) and the GPLv2 (found
|
|
* in the COPYING file in the root directory of this source tree).
|
|
* You may select, at your option, one of the above-listed licenses.
|
|
*/
|
|
|
|
#include "zstd_compress_internal.h"
|
|
#include "matchfinder.h"
|
|
|
|
#define HSIZE 1024
|
|
static U32 const HLOG = 10;
|
|
static U32 const MLS = 4;
|
|
static U32 const BADIDX = 0xffffffff;
|
|
|
|
size_t simpleExternalMatchFinder(
|
|
void* externalMatchState,
|
|
ZSTD_Sequence* outSeqs, size_t outSeqsCapacity,
|
|
const void* src, size_t srcSize,
|
|
const void* dict, size_t dictSize,
|
|
int compressionLevel,
|
|
size_t windowSize
|
|
) {
|
|
const BYTE* const istart = (const BYTE*)src;
|
|
const BYTE* const iend = istart + srcSize;
|
|
const BYTE* ip = istart;
|
|
const BYTE* anchor = istart;
|
|
size_t seqCount = 0;
|
|
U32 hashTable[HSIZE];
|
|
|
|
(void)externalMatchState;
|
|
(void)dict;
|
|
(void)dictSize;
|
|
(void)outSeqsCapacity;
|
|
(void)compressionLevel;
|
|
|
|
{ int i;
|
|
for (i=0; i < HSIZE; i++) {
|
|
hashTable[i] = BADIDX;
|
|
} }
|
|
|
|
while (ip + MLS < iend) {
|
|
size_t const hash = ZSTD_hashPtr(ip, HLOG, MLS);
|
|
U32 const matchIndex = hashTable[hash];
|
|
hashTable[hash] = (U32)(ip - istart);
|
|
|
|
if (matchIndex != BADIDX) {
|
|
const BYTE* const match = istart + matchIndex;
|
|
U32 const matchLen = (U32)ZSTD_count(ip, match, iend);
|
|
if (matchLen >= ZSTD_MINMATCH_MIN) {
|
|
U32 const litLen = (U32)(ip - anchor);
|
|
U32 const offset = (U32)(ip - match);
|
|
ZSTD_Sequence const seq = {
|
|
offset, litLen, matchLen, 0
|
|
};
|
|
|
|
/* Note: it's crucial to stay within the window size! */
|
|
if (offset <= windowSize) {
|
|
outSeqs[seqCount++] = seq;
|
|
ip += matchLen;
|
|
anchor = ip;
|
|
continue;
|
|
}
|
|
}
|
|
}
|
|
|
|
ip++;
|
|
}
|
|
|
|
{ ZSTD_Sequence const finalSeq = {
|
|
0, (U32)(iend - anchor), 0, 0
|
|
};
|
|
outSeqs[seqCount++] = finalSeq;
|
|
}
|
|
|
|
return seqCount;
|
|
}
|