diff options
Diffstat (limited to 'lib/zstd/compress/zstd_ldm.c')
| -rw-r--r-- | lib/zstd/compress/zstd_ldm.c | 102 | 
1 files changed, 62 insertions, 40 deletions
| diff --git a/lib/zstd/compress/zstd_ldm.c b/lib/zstd/compress/zstd_ldm.c index dd86fc83e7dd..54eefad9cae6 100644 --- a/lib/zstd/compress/zstd_ldm.c +++ b/lib/zstd/compress/zstd_ldm.c @@ -1,5 +1,6 @@ +// SPDX-License-Identifier: GPL-2.0+ OR BSD-3-Clause  /* - * Copyright (c) Yann Collet, Facebook, Inc. + * Copyright (c) Meta Platforms, Inc. and affiliates.   * All rights reserved.   *   * This source code is licensed under both the BSD-style license (found in the @@ -16,7 +17,7 @@  #include "zstd_double_fast.h"   /* ZSTD_fillDoubleHashTable() */  #include "zstd_ldm_geartab.h" -#define LDM_BUCKET_SIZE_LOG 3 +#define LDM_BUCKET_SIZE_LOG 4  #define LDM_MIN_MATCH_LENGTH 64  #define LDM_HASH_RLOG 7 @@ -133,21 +134,35 @@ done:  }  void ZSTD_ldm_adjustParameters(ldmParams_t* params, -                               ZSTD_compressionParameters const* cParams) +                        const ZSTD_compressionParameters* cParams)  {      params->windowLog = cParams->windowLog;      ZSTD_STATIC_ASSERT(LDM_BUCKET_SIZE_LOG <= ZSTD_LDM_BUCKETSIZELOG_MAX);      DEBUGLOG(4, "ZSTD_ldm_adjustParameters"); -    if (!params->bucketSizeLog) params->bucketSizeLog = LDM_BUCKET_SIZE_LOG; -    if (!params->minMatchLength) params->minMatchLength = LDM_MIN_MATCH_LENGTH; +    if (params->hashRateLog == 0) { +        if (params->hashLog > 0) { +            /* if params->hashLog is set, derive hashRateLog from it */ +            assert(params->hashLog <= ZSTD_HASHLOG_MAX); +            if (params->windowLog > params->hashLog) { +                params->hashRateLog = params->windowLog - params->hashLog; +            } +        } else { +            assert(1 <= (int)cParams->strategy && (int)cParams->strategy <= 9); +            /* mapping from [fast, rate7] to [btultra2, rate4] */ +            params->hashRateLog = 7 - (cParams->strategy/3); +        } +    }      if (params->hashLog == 0) { -        params->hashLog = MAX(ZSTD_HASHLOG_MIN, params->windowLog - LDM_HASH_RLOG); -        assert(params->hashLog <= ZSTD_HASHLOG_MAX); +        params->hashLog = BOUNDED(ZSTD_HASHLOG_MIN, params->windowLog - params->hashRateLog, ZSTD_HASHLOG_MAX);      } -    if (params->hashRateLog == 0) { -        params->hashRateLog = params->windowLog < params->hashLog -                                   ? 0 -                                   : params->windowLog - params->hashLog; +    if (params->minMatchLength == 0) { +        params->minMatchLength = LDM_MIN_MATCH_LENGTH; +        if (cParams->strategy >= ZSTD_btultra) +            params->minMatchLength /= 2; +    } +    if (params->bucketSizeLog==0) { +        assert(1 <= (int)cParams->strategy && (int)cParams->strategy <= 9); +        params->bucketSizeLog = BOUNDED(LDM_BUCKET_SIZE_LOG, (U32)cParams->strategy, ZSTD_LDM_BUCKETSIZELOG_MAX);      }      params->bucketSizeLog = MIN(params->bucketSizeLog, params->hashLog);  } @@ -170,22 +185,22 @@ size_t ZSTD_ldm_getMaxNbSeq(ldmParams_t params, size_t maxChunkSize)  /* ZSTD_ldm_getBucket() :   *  Returns a pointer to the start of the bucket associated with hash. */  static ldmEntry_t* ZSTD_ldm_getBucket( -        ldmState_t* ldmState, size_t hash, ldmParams_t const ldmParams) +        const ldmState_t* ldmState, size_t hash, U32 const bucketSizeLog)  { -    return ldmState->hashTable + (hash << ldmParams.bucketSizeLog); +    return ldmState->hashTable + (hash << bucketSizeLog);  }  /* ZSTD_ldm_insertEntry() :   *  Insert the entry with corresponding hash into the hash table */  static void ZSTD_ldm_insertEntry(ldmState_t* ldmState,                                   size_t const hash, const ldmEntry_t entry, -                                 ldmParams_t const ldmParams) +                                 U32 const bucketSizeLog)  {      BYTE* const pOffset = ldmState->bucketOffsets + hash;      unsigned const offset = *pOffset; -    *(ZSTD_ldm_getBucket(ldmState, hash, ldmParams) + offset) = entry; -    *pOffset = (BYTE)((offset + 1) & ((1u << ldmParams.bucketSizeLog) - 1)); +    *(ZSTD_ldm_getBucket(ldmState, hash, bucketSizeLog) + offset) = entry; +    *pOffset = (BYTE)((offset + 1) & ((1u << bucketSizeLog) - 1));  } @@ -234,7 +249,7 @@ static size_t ZSTD_ldm_countBackwardsMatch_2segments(   *   *  The tables for the other strategies are filled within their   *  block compressors. */ -static size_t ZSTD_ldm_fillFastTables(ZSTD_matchState_t* ms, +static size_t ZSTD_ldm_fillFastTables(ZSTD_MatchState_t* ms,                                        void const* end)  {      const BYTE* const iend = (const BYTE*)end; @@ -242,11 +257,15 @@ static size_t ZSTD_ldm_fillFastTables(ZSTD_matchState_t* ms,      switch(ms->cParams.strategy)      {      case ZSTD_fast: -        ZSTD_fillHashTable(ms, iend, ZSTD_dtlm_fast); +        ZSTD_fillHashTable(ms, iend, ZSTD_dtlm_fast, ZSTD_tfp_forCCtx);          break;      case ZSTD_dfast: -        ZSTD_fillDoubleHashTable(ms, iend, ZSTD_dtlm_fast); +#ifndef ZSTD_EXCLUDE_DFAST_BLOCK_COMPRESSOR +        ZSTD_fillDoubleHashTable(ms, iend, ZSTD_dtlm_fast, ZSTD_tfp_forCCtx); +#else +        assert(0); /* shouldn't be called: cparams should've been adjusted. */ +#endif          break;      case ZSTD_greedy: @@ -269,7 +288,8 @@ void ZSTD_ldm_fillHashTable(              const BYTE* iend, ldmParams_t const* params)  {      U32 const minMatchLength = params->minMatchLength; -    U32 const hBits = params->hashLog - params->bucketSizeLog; +    U32 const bucketSizeLog = params->bucketSizeLog; +    U32 const hBits = params->hashLog - bucketSizeLog;      BYTE const* const base = ldmState->window.base;      BYTE const* const istart = ip;      ldmRollingHashState_t hashState; @@ -284,7 +304,7 @@ void ZSTD_ldm_fillHashTable(          unsigned n;          numSplits = 0; -        hashed = ZSTD_ldm_gear_feed(&hashState, ip, iend - ip, splits, &numSplits); +        hashed = ZSTD_ldm_gear_feed(&hashState, ip, (size_t)(iend - ip), splits, &numSplits);          for (n = 0; n < numSplits; n++) {              if (ip + splits[n] >= istart + minMatchLength) { @@ -295,7 +315,7 @@ void ZSTD_ldm_fillHashTable(                  entry.offset = (U32)(split - base);                  entry.checksum = (U32)(xxhash >> 32); -                ZSTD_ldm_insertEntry(ldmState, hash, entry, *params); +                ZSTD_ldm_insertEntry(ldmState, hash, entry, params->bucketSizeLog);              }          } @@ -309,7 +329,7 @@ void ZSTD_ldm_fillHashTable(   *  Sets cctx->nextToUpdate to a position corresponding closer to anchor   *  if it is far way   *  (after a long match, only update tables a limited amount). */ -static void ZSTD_ldm_limitTableUpdate(ZSTD_matchState_t* ms, const BYTE* anchor) +static void ZSTD_ldm_limitTableUpdate(ZSTD_MatchState_t* ms, const BYTE* anchor)  {      U32 const curr = (U32)(anchor - ms->window.base);      if (curr > ms->nextToUpdate + 1024) { @@ -318,8 +338,10 @@ static void ZSTD_ldm_limitTableUpdate(ZSTD_matchState_t* ms, const BYTE* anchor)      }  } -static size_t ZSTD_ldm_generateSequences_internal( -        ldmState_t* ldmState, rawSeqStore_t* rawSeqStore, +static +ZSTD_ALLOW_POINTER_OVERFLOW_ATTR +size_t ZSTD_ldm_generateSequences_internal( +        ldmState_t* ldmState, RawSeqStore_t* rawSeqStore,          ldmParams_t const* params, void const* src, size_t srcSize)  {      /* LDM parameters */ @@ -373,7 +395,7 @@ static size_t ZSTD_ldm_generateSequences_internal(              candidates[n].split = split;              candidates[n].hash = hash;              candidates[n].checksum = (U32)(xxhash >> 32); -            candidates[n].bucket = ZSTD_ldm_getBucket(ldmState, hash, *params); +            candidates[n].bucket = ZSTD_ldm_getBucket(ldmState, hash, params->bucketSizeLog);              PREFETCH_L1(candidates[n].bucket);          } @@ -396,7 +418,7 @@ static size_t ZSTD_ldm_generateSequences_internal(               * the previous one, we merely register it in the hash table and               * move on */              if (split < anchor) { -                ZSTD_ldm_insertEntry(ldmState, hash, newEntry, *params); +                ZSTD_ldm_insertEntry(ldmState, hash, newEntry, params->bucketSizeLog);                  continue;              } @@ -443,7 +465,7 @@ static size_t ZSTD_ldm_generateSequences_internal(              /* No match found -- insert an entry into the hash table               * and process the next candidate match */              if (bestEntry == NULL) { -                ZSTD_ldm_insertEntry(ldmState, hash, newEntry, *params); +                ZSTD_ldm_insertEntry(ldmState, hash, newEntry, params->bucketSizeLog);                  continue;              } @@ -464,7 +486,7 @@ static size_t ZSTD_ldm_generateSequences_internal(              /* Insert the current entry into the hash table --- it must be               * done after the previous block to avoid clobbering bestEntry */ -            ZSTD_ldm_insertEntry(ldmState, hash, newEntry, *params); +            ZSTD_ldm_insertEntry(ldmState, hash, newEntry, params->bucketSizeLog);              anchor = split + forwardMatchLength; @@ -503,7 +525,7 @@ static void ZSTD_ldm_reduceTable(ldmEntry_t* const table, U32 const size,  }  size_t ZSTD_ldm_generateSequences( -        ldmState_t* ldmState, rawSeqStore_t* sequences, +        ldmState_t* ldmState, RawSeqStore_t* sequences,          ldmParams_t const* params, void const* src, size_t srcSize)  {      U32 const maxDist = 1U << params->windowLog; @@ -549,7 +571,7 @@ size_t ZSTD_ldm_generateSequences(           * the window through early invalidation.           * TODO: * Test the chunk size.           *       * Try invalidation after the sequence generation and test the -         *         the offset against maxDist directly. +         *         offset against maxDist directly.           *           * NOTE: Because of dictionaries + sequence splitting we MUST make sure           * that any offset used is valid at the END of the sequence, since it may @@ -580,7 +602,7 @@ size_t ZSTD_ldm_generateSequences(  }  void -ZSTD_ldm_skipSequences(rawSeqStore_t* rawSeqStore, size_t srcSize, U32 const minMatch) +ZSTD_ldm_skipSequences(RawSeqStore_t* rawSeqStore, size_t srcSize, U32 const minMatch)  {      while (srcSize > 0 && rawSeqStore->pos < rawSeqStore->size) {          rawSeq* seq = rawSeqStore->seq + rawSeqStore->pos; @@ -616,7 +638,7 @@ ZSTD_ldm_skipSequences(rawSeqStore_t* rawSeqStore, size_t srcSize, U32 const min   * Returns the current sequence to handle, or if the rest of the block should   * be literals, it returns a sequence with offset == 0.   */ -static rawSeq maybeSplitSequence(rawSeqStore_t* rawSeqStore, +static rawSeq maybeSplitSequence(RawSeqStore_t* rawSeqStore,                                   U32 const remaining, U32 const minMatch)  {      rawSeq sequence = rawSeqStore->seq[rawSeqStore->pos]; @@ -640,7 +662,7 @@ static rawSeq maybeSplitSequence(rawSeqStore_t* rawSeqStore,      return sequence;  } -void ZSTD_ldm_skipRawSeqStoreBytes(rawSeqStore_t* rawSeqStore, size_t nbBytes) { +void ZSTD_ldm_skipRawSeqStoreBytes(RawSeqStore_t* rawSeqStore, size_t nbBytes) {      U32 currPos = (U32)(rawSeqStore->posInSequence + nbBytes);      while (currPos && rawSeqStore->pos < rawSeqStore->size) {          rawSeq currSeq = rawSeqStore->seq[rawSeqStore->pos]; @@ -657,14 +679,14 @@ void ZSTD_ldm_skipRawSeqStoreBytes(rawSeqStore_t* rawSeqStore, size_t nbBytes) {      }  } -size_t ZSTD_ldm_blockCompress(rawSeqStore_t* rawSeqStore, -    ZSTD_matchState_t* ms, seqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], -    ZSTD_paramSwitch_e useRowMatchFinder, +size_t ZSTD_ldm_blockCompress(RawSeqStore_t* rawSeqStore, +    ZSTD_MatchState_t* ms, SeqStore_t* seqStore, U32 rep[ZSTD_REP_NUM], +    ZSTD_ParamSwitch_e useRowMatchFinder,      void const* src, size_t srcSize)  {      const ZSTD_compressionParameters* const cParams = &ms->cParams;      unsigned const minMatch = cParams->minMatch; -    ZSTD_blockCompressor const blockCompressor = +    ZSTD_BlockCompressor_f const blockCompressor =          ZSTD_selectBlockCompressor(cParams->strategy, useRowMatchFinder, ZSTD_matchState_dictMode(ms));      /* Input bounds */      BYTE const* const istart = (BYTE const*)src; @@ -689,7 +711,6 @@ size_t ZSTD_ldm_blockCompress(rawSeqStore_t* rawSeqStore,          /* maybeSplitSequence updates rawSeqStore->pos */          rawSeq const sequence = maybeSplitSequence(rawSeqStore,                                                     (U32)(iend - ip), minMatch); -        int i;          /* End signal */          if (sequence.offset == 0)              break; @@ -702,6 +723,7 @@ size_t ZSTD_ldm_blockCompress(rawSeqStore_t* rawSeqStore,          /* Run the block compressor */          DEBUGLOG(5, "pos %u : calling block compressor on segment of size %u", (unsigned)(ip-istart), sequence.litLength);          { +            int i;              size_t const newLitLength =                  blockCompressor(ms, seqStore, rep, ip, sequence.litLength);              ip += sequence.litLength; @@ -711,7 +733,7 @@ size_t ZSTD_ldm_blockCompress(rawSeqStore_t* rawSeqStore,              rep[0] = sequence.offset;              /* Store the sequence */              ZSTD_storeSeq(seqStore, newLitLength, ip - newLitLength, iend, -                          STORE_OFFSET(sequence.offset), +                          OFFSET_TO_OFFBASE(sequence.offset),                            sequence.matchLength);              ip += sequence.matchLength;          } | 
