Merge pull request #766 from terrelln/real-block-split
[libzstd] Pull optimal parser state out of seqStore_t
This commit is contained in:
commit
77d67fb167
@ -215,20 +215,6 @@ MEM_STATIC void ZSTD_wildcopy_e(void* dst, const void* src, void* dstEnd) /* s
|
|||||||
*********************************************/
|
*********************************************/
|
||||||
typedef struct ZSTD_stats_s ZSTD_stats_t;
|
typedef struct ZSTD_stats_s ZSTD_stats_t;
|
||||||
|
|
||||||
typedef struct {
|
|
||||||
U32 off;
|
|
||||||
U32 len;
|
|
||||||
} ZSTD_match_t;
|
|
||||||
|
|
||||||
typedef struct {
|
|
||||||
U32 price;
|
|
||||||
U32 off;
|
|
||||||
U32 mlen;
|
|
||||||
U32 litlen;
|
|
||||||
U32 rep[ZSTD_REP_NUM];
|
|
||||||
} ZSTD_optimal_t;
|
|
||||||
|
|
||||||
|
|
||||||
typedef struct seqDef_s {
|
typedef struct seqDef_s {
|
||||||
U32 offset;
|
U32 offset;
|
||||||
U16 litLength;
|
U16 litLength;
|
||||||
@ -248,13 +234,29 @@ typedef struct {
|
|||||||
U32 longLengthPos;
|
U32 longLengthPos;
|
||||||
U32 rep[ZSTD_REP_NUM];
|
U32 rep[ZSTD_REP_NUM];
|
||||||
U32 repToConfirm[ZSTD_REP_NUM];
|
U32 repToConfirm[ZSTD_REP_NUM];
|
||||||
/* opt */
|
} seqStore_t;
|
||||||
ZSTD_optimal_t* priceTable;
|
|
||||||
ZSTD_match_t* matchTable;
|
typedef struct {
|
||||||
U32* matchLengthFreq;
|
U32 off;
|
||||||
U32* litLengthFreq;
|
U32 len;
|
||||||
|
} ZSTD_match_t;
|
||||||
|
|
||||||
|
typedef struct {
|
||||||
|
U32 price;
|
||||||
|
U32 off;
|
||||||
|
U32 mlen;
|
||||||
|
U32 litlen;
|
||||||
|
U32 rep[ZSTD_REP_NUM];
|
||||||
|
} ZSTD_optimal_t;
|
||||||
|
|
||||||
|
typedef struct {
|
||||||
U32* litFreq;
|
U32* litFreq;
|
||||||
|
U32* litLengthFreq;
|
||||||
|
U32* matchLengthFreq;
|
||||||
U32* offCodeFreq;
|
U32* offCodeFreq;
|
||||||
|
ZSTD_match_t* matchTable;
|
||||||
|
ZSTD_optimal_t* priceTable;
|
||||||
|
|
||||||
U32 matchLengthSum;
|
U32 matchLengthSum;
|
||||||
U32 matchSum;
|
U32 matchSum;
|
||||||
U32 litLengthSum;
|
U32 litLengthSum;
|
||||||
@ -270,7 +272,7 @@ typedef struct {
|
|||||||
U32 cachedPrice;
|
U32 cachedPrice;
|
||||||
U32 cachedLitLength;
|
U32 cachedLitLength;
|
||||||
const BYTE* cachedLiterals;
|
const BYTE* cachedLiterals;
|
||||||
} seqStore_t;
|
} optState_t;
|
||||||
|
|
||||||
typedef struct {
|
typedef struct {
|
||||||
U32 hufCTable[HUF_CTABLE_SIZE_U32(255)];
|
U32 hufCTable[HUF_CTABLE_SIZE_U32(255)];
|
||||||
|
@ -96,6 +96,7 @@ struct ZSTD_CCtx_s {
|
|||||||
size_t staticSize;
|
size_t staticSize;
|
||||||
|
|
||||||
seqStore_t seqStore; /* sequences storage ptrs */
|
seqStore_t seqStore; /* sequences storage ptrs */
|
||||||
|
optState_t optState;
|
||||||
U32* hashTable;
|
U32* hashTable;
|
||||||
U32* hashTable3;
|
U32* hashTable3;
|
||||||
U32* chainTable;
|
U32* chainTable;
|
||||||
@ -595,7 +596,7 @@ static size_t ZSTD_continueCCtx(ZSTD_CCtx* cctx, ZSTD_parameters params, U64 ple
|
|||||||
cctx->dictID = 0;
|
cctx->dictID = 0;
|
||||||
cctx->loadedDictEnd = 0;
|
cctx->loadedDictEnd = 0;
|
||||||
{ int i; for (i=0; i<ZSTD_REP_NUM; i++) cctx->seqStore.rep[i] = repStartValue[i]; }
|
{ int i; for (i=0; i<ZSTD_REP_NUM; i++) cctx->seqStore.rep[i] = repStartValue[i]; }
|
||||||
cctx->seqStore.litLengthSum = 0; /* force reset of btopt stats */
|
cctx->optState.litLengthSum = 0; /* force reset of btopt stats */
|
||||||
XXH64_reset(&cctx->xxhState, 0);
|
XXH64_reset(&cctx->xxhState, 0);
|
||||||
return 0;
|
return 0;
|
||||||
}
|
}
|
||||||
@ -694,7 +695,7 @@ static size_t ZSTD_resetCCtx_internal(ZSTD_CCtx* zc,
|
|||||||
zc->lowLimit = 0;
|
zc->lowLimit = 0;
|
||||||
{ int i; for (i=0; i<ZSTD_REP_NUM; i++) zc->seqStore.rep[i] = repStartValue[i]; }
|
{ int i; for (i=0; i<ZSTD_REP_NUM; i++) zc->seqStore.rep[i] = repStartValue[i]; }
|
||||||
zc->hashLog3 = hashLog3;
|
zc->hashLog3 = hashLog3;
|
||||||
zc->seqStore.litLengthSum = 0;
|
zc->optState.litLengthSum = 0;
|
||||||
|
|
||||||
ptr = zc->entropy + 1;
|
ptr = zc->entropy + 1;
|
||||||
|
|
||||||
@ -702,15 +703,15 @@ static size_t ZSTD_resetCCtx_internal(ZSTD_CCtx* zc,
|
|||||||
if ((params.cParams.strategy == ZSTD_btopt) || (params.cParams.strategy == ZSTD_btultra)) {
|
if ((params.cParams.strategy == ZSTD_btopt) || (params.cParams.strategy == ZSTD_btultra)) {
|
||||||
DEBUGLOG(5, "reserving optimal parser space");
|
DEBUGLOG(5, "reserving optimal parser space");
|
||||||
assert(((size_t)ptr & 3) == 0); /* ensure ptr is properly aligned */
|
assert(((size_t)ptr & 3) == 0); /* ensure ptr is properly aligned */
|
||||||
zc->seqStore.litFreq = (U32*)ptr;
|
zc->optState.litFreq = (U32*)ptr;
|
||||||
zc->seqStore.litLengthFreq = zc->seqStore.litFreq + (1<<Litbits);
|
zc->optState.litLengthFreq = zc->optState.litFreq + (1<<Litbits);
|
||||||
zc->seqStore.matchLengthFreq = zc->seqStore.litLengthFreq + (MaxLL+1);
|
zc->optState.matchLengthFreq = zc->optState.litLengthFreq + (MaxLL+1);
|
||||||
zc->seqStore.offCodeFreq = zc->seqStore.matchLengthFreq + (MaxML+1);
|
zc->optState.offCodeFreq = zc->optState.matchLengthFreq + (MaxML+1);
|
||||||
ptr = zc->seqStore.offCodeFreq + (MaxOff+1);
|
ptr = zc->optState.offCodeFreq + (MaxOff+1);
|
||||||
zc->seqStore.matchTable = (ZSTD_match_t*)ptr;
|
zc->optState.matchTable = (ZSTD_match_t*)ptr;
|
||||||
ptr = zc->seqStore.matchTable + ZSTD_OPT_NUM+1;
|
ptr = zc->optState.matchTable + ZSTD_OPT_NUM+1;
|
||||||
zc->seqStore.priceTable = (ZSTD_optimal_t*)ptr;
|
zc->optState.priceTable = (ZSTD_optimal_t*)ptr;
|
||||||
ptr = zc->seqStore.priceTable + ZSTD_OPT_NUM+1;
|
ptr = zc->optState.priceTable + ZSTD_OPT_NUM+1;
|
||||||
}
|
}
|
||||||
|
|
||||||
/* table Space */
|
/* table Space */
|
||||||
|
@ -22,173 +22,173 @@
|
|||||||
/*-*************************************
|
/*-*************************************
|
||||||
* Price functions for optimal parser
|
* Price functions for optimal parser
|
||||||
***************************************/
|
***************************************/
|
||||||
FORCE_INLINE void ZSTD_setLog2Prices(seqStore_t* ssPtr)
|
FORCE_INLINE void ZSTD_setLog2Prices(optState_t* optPtr)
|
||||||
{
|
{
|
||||||
ssPtr->log2matchLengthSum = ZSTD_highbit32(ssPtr->matchLengthSum+1);
|
optPtr->log2matchLengthSum = ZSTD_highbit32(optPtr->matchLengthSum+1);
|
||||||
ssPtr->log2litLengthSum = ZSTD_highbit32(ssPtr->litLengthSum+1);
|
optPtr->log2litLengthSum = ZSTD_highbit32(optPtr->litLengthSum+1);
|
||||||
ssPtr->log2litSum = ZSTD_highbit32(ssPtr->litSum+1);
|
optPtr->log2litSum = ZSTD_highbit32(optPtr->litSum+1);
|
||||||
ssPtr->log2offCodeSum = ZSTD_highbit32(ssPtr->offCodeSum+1);
|
optPtr->log2offCodeSum = ZSTD_highbit32(optPtr->offCodeSum+1);
|
||||||
ssPtr->factor = 1 + ((ssPtr->litSum>>5) / ssPtr->litLengthSum) + ((ssPtr->litSum<<1) / (ssPtr->litSum + ssPtr->matchSum));
|
optPtr->factor = 1 + ((optPtr->litSum>>5) / optPtr->litLengthSum) + ((optPtr->litSum<<1) / (optPtr->litSum + optPtr->matchSum));
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
MEM_STATIC void ZSTD_rescaleFreqs(seqStore_t* ssPtr, const BYTE* src, size_t srcSize)
|
MEM_STATIC void ZSTD_rescaleFreqs(optState_t* optPtr, const BYTE* src, size_t srcSize)
|
||||||
{
|
{
|
||||||
unsigned u;
|
unsigned u;
|
||||||
|
|
||||||
ssPtr->cachedLiterals = NULL;
|
optPtr->cachedLiterals = NULL;
|
||||||
ssPtr->cachedPrice = ssPtr->cachedLitLength = 0;
|
optPtr->cachedPrice = optPtr->cachedLitLength = 0;
|
||||||
ssPtr->staticPrices = 0;
|
optPtr->staticPrices = 0;
|
||||||
|
|
||||||
if (ssPtr->litLengthSum == 0) {
|
if (optPtr->litLengthSum == 0) {
|
||||||
if (srcSize <= 1024) ssPtr->staticPrices = 1;
|
if (srcSize <= 1024) optPtr->staticPrices = 1;
|
||||||
|
|
||||||
assert(ssPtr->litFreq!=NULL);
|
assert(optPtr->litFreq!=NULL);
|
||||||
for (u=0; u<=MaxLit; u++)
|
for (u=0; u<=MaxLit; u++)
|
||||||
ssPtr->litFreq[u] = 0;
|
optPtr->litFreq[u] = 0;
|
||||||
for (u=0; u<srcSize; u++)
|
for (u=0; u<srcSize; u++)
|
||||||
ssPtr->litFreq[src[u]]++;
|
optPtr->litFreq[src[u]]++;
|
||||||
|
|
||||||
ssPtr->litSum = 0;
|
optPtr->litSum = 0;
|
||||||
ssPtr->litLengthSum = MaxLL+1;
|
optPtr->litLengthSum = MaxLL+1;
|
||||||
ssPtr->matchLengthSum = MaxML+1;
|
optPtr->matchLengthSum = MaxML+1;
|
||||||
ssPtr->offCodeSum = (MaxOff+1);
|
optPtr->offCodeSum = (MaxOff+1);
|
||||||
ssPtr->matchSum = (ZSTD_LITFREQ_ADD<<Litbits);
|
optPtr->matchSum = (ZSTD_LITFREQ_ADD<<Litbits);
|
||||||
|
|
||||||
for (u=0; u<=MaxLit; u++) {
|
for (u=0; u<=MaxLit; u++) {
|
||||||
ssPtr->litFreq[u] = 1 + (ssPtr->litFreq[u]>>ZSTD_FREQ_DIV);
|
optPtr->litFreq[u] = 1 + (optPtr->litFreq[u]>>ZSTD_FREQ_DIV);
|
||||||
ssPtr->litSum += ssPtr->litFreq[u];
|
optPtr->litSum += optPtr->litFreq[u];
|
||||||
}
|
}
|
||||||
for (u=0; u<=MaxLL; u++)
|
for (u=0; u<=MaxLL; u++)
|
||||||
ssPtr->litLengthFreq[u] = 1;
|
optPtr->litLengthFreq[u] = 1;
|
||||||
for (u=0; u<=MaxML; u++)
|
for (u=0; u<=MaxML; u++)
|
||||||
ssPtr->matchLengthFreq[u] = 1;
|
optPtr->matchLengthFreq[u] = 1;
|
||||||
for (u=0; u<=MaxOff; u++)
|
for (u=0; u<=MaxOff; u++)
|
||||||
ssPtr->offCodeFreq[u] = 1;
|
optPtr->offCodeFreq[u] = 1;
|
||||||
} else {
|
} else {
|
||||||
ssPtr->matchLengthSum = 0;
|
optPtr->matchLengthSum = 0;
|
||||||
ssPtr->litLengthSum = 0;
|
optPtr->litLengthSum = 0;
|
||||||
ssPtr->offCodeSum = 0;
|
optPtr->offCodeSum = 0;
|
||||||
ssPtr->matchSum = 0;
|
optPtr->matchSum = 0;
|
||||||
ssPtr->litSum = 0;
|
optPtr->litSum = 0;
|
||||||
|
|
||||||
for (u=0; u<=MaxLit; u++) {
|
for (u=0; u<=MaxLit; u++) {
|
||||||
ssPtr->litFreq[u] = 1 + (ssPtr->litFreq[u]>>(ZSTD_FREQ_DIV+1));
|
optPtr->litFreq[u] = 1 + (optPtr->litFreq[u]>>(ZSTD_FREQ_DIV+1));
|
||||||
ssPtr->litSum += ssPtr->litFreq[u];
|
optPtr->litSum += optPtr->litFreq[u];
|
||||||
}
|
}
|
||||||
for (u=0; u<=MaxLL; u++) {
|
for (u=0; u<=MaxLL; u++) {
|
||||||
ssPtr->litLengthFreq[u] = 1 + (ssPtr->litLengthFreq[u]>>(ZSTD_FREQ_DIV+1));
|
optPtr->litLengthFreq[u] = 1 + (optPtr->litLengthFreq[u]>>(ZSTD_FREQ_DIV+1));
|
||||||
ssPtr->litLengthSum += ssPtr->litLengthFreq[u];
|
optPtr->litLengthSum += optPtr->litLengthFreq[u];
|
||||||
}
|
}
|
||||||
for (u=0; u<=MaxML; u++) {
|
for (u=0; u<=MaxML; u++) {
|
||||||
ssPtr->matchLengthFreq[u] = 1 + (ssPtr->matchLengthFreq[u]>>ZSTD_FREQ_DIV);
|
optPtr->matchLengthFreq[u] = 1 + (optPtr->matchLengthFreq[u]>>ZSTD_FREQ_DIV);
|
||||||
ssPtr->matchLengthSum += ssPtr->matchLengthFreq[u];
|
optPtr->matchLengthSum += optPtr->matchLengthFreq[u];
|
||||||
ssPtr->matchSum += ssPtr->matchLengthFreq[u] * (u + 3);
|
optPtr->matchSum += optPtr->matchLengthFreq[u] * (u + 3);
|
||||||
}
|
}
|
||||||
ssPtr->matchSum *= ZSTD_LITFREQ_ADD;
|
optPtr->matchSum *= ZSTD_LITFREQ_ADD;
|
||||||
for (u=0; u<=MaxOff; u++) {
|
for (u=0; u<=MaxOff; u++) {
|
||||||
ssPtr->offCodeFreq[u] = 1 + (ssPtr->offCodeFreq[u]>>ZSTD_FREQ_DIV);
|
optPtr->offCodeFreq[u] = 1 + (optPtr->offCodeFreq[u]>>ZSTD_FREQ_DIV);
|
||||||
ssPtr->offCodeSum += ssPtr->offCodeFreq[u];
|
optPtr->offCodeSum += optPtr->offCodeFreq[u];
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
ZSTD_setLog2Prices(ssPtr);
|
ZSTD_setLog2Prices(optPtr);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
FORCE_INLINE U32 ZSTD_getLiteralPrice(seqStore_t* ssPtr, U32 litLength, const BYTE* literals)
|
FORCE_INLINE U32 ZSTD_getLiteralPrice(optState_t* optPtr, U32 litLength, const BYTE* literals)
|
||||||
{
|
{
|
||||||
U32 price, u;
|
U32 price, u;
|
||||||
|
|
||||||
if (ssPtr->staticPrices)
|
if (optPtr->staticPrices)
|
||||||
return ZSTD_highbit32((U32)litLength+1) + (litLength*6);
|
return ZSTD_highbit32((U32)litLength+1) + (litLength*6);
|
||||||
|
|
||||||
if (litLength == 0)
|
if (litLength == 0)
|
||||||
return ssPtr->log2litLengthSum - ZSTD_highbit32(ssPtr->litLengthFreq[0]+1);
|
return optPtr->log2litLengthSum - ZSTD_highbit32(optPtr->litLengthFreq[0]+1);
|
||||||
|
|
||||||
/* literals */
|
/* literals */
|
||||||
if (ssPtr->cachedLiterals == literals) {
|
if (optPtr->cachedLiterals == literals) {
|
||||||
U32 const additional = litLength - ssPtr->cachedLitLength;
|
U32 const additional = litLength - optPtr->cachedLitLength;
|
||||||
const BYTE* literals2 = ssPtr->cachedLiterals + ssPtr->cachedLitLength;
|
const BYTE* literals2 = optPtr->cachedLiterals + optPtr->cachedLitLength;
|
||||||
price = ssPtr->cachedPrice + additional * ssPtr->log2litSum;
|
price = optPtr->cachedPrice + additional * optPtr->log2litSum;
|
||||||
for (u=0; u < additional; u++)
|
for (u=0; u < additional; u++)
|
||||||
price -= ZSTD_highbit32(ssPtr->litFreq[literals2[u]]+1);
|
price -= ZSTD_highbit32(optPtr->litFreq[literals2[u]]+1);
|
||||||
ssPtr->cachedPrice = price;
|
optPtr->cachedPrice = price;
|
||||||
ssPtr->cachedLitLength = litLength;
|
optPtr->cachedLitLength = litLength;
|
||||||
} else {
|
} else {
|
||||||
price = litLength * ssPtr->log2litSum;
|
price = litLength * optPtr->log2litSum;
|
||||||
for (u=0; u < litLength; u++)
|
for (u=0; u < litLength; u++)
|
||||||
price -= ZSTD_highbit32(ssPtr->litFreq[literals[u]]+1);
|
price -= ZSTD_highbit32(optPtr->litFreq[literals[u]]+1);
|
||||||
|
|
||||||
if (litLength >= 12) {
|
if (litLength >= 12) {
|
||||||
ssPtr->cachedLiterals = literals;
|
optPtr->cachedLiterals = literals;
|
||||||
ssPtr->cachedPrice = price;
|
optPtr->cachedPrice = price;
|
||||||
ssPtr->cachedLitLength = litLength;
|
optPtr->cachedLitLength = litLength;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
/* literal Length */
|
/* literal Length */
|
||||||
{ const BYTE LL_deltaCode = 19;
|
{ const BYTE LL_deltaCode = 19;
|
||||||
const BYTE llCode = (litLength>63) ? (BYTE)ZSTD_highbit32(litLength) + LL_deltaCode : LL_Code[litLength];
|
const BYTE llCode = (litLength>63) ? (BYTE)ZSTD_highbit32(litLength) + LL_deltaCode : LL_Code[litLength];
|
||||||
price += LL_bits[llCode] + ssPtr->log2litLengthSum - ZSTD_highbit32(ssPtr->litLengthFreq[llCode]+1);
|
price += LL_bits[llCode] + optPtr->log2litLengthSum - ZSTD_highbit32(optPtr->litLengthFreq[llCode]+1);
|
||||||
}
|
}
|
||||||
|
|
||||||
return price;
|
return price;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
FORCE_INLINE U32 ZSTD_getPrice(seqStore_t* seqStorePtr, U32 litLength, const BYTE* literals, U32 offset, U32 matchLength, const int ultra)
|
FORCE_INLINE U32 ZSTD_getPrice(optState_t* optPtr, U32 litLength, const BYTE* literals, U32 offset, U32 matchLength, const int ultra)
|
||||||
{
|
{
|
||||||
/* offset */
|
/* offset */
|
||||||
U32 price;
|
U32 price;
|
||||||
BYTE const offCode = (BYTE)ZSTD_highbit32(offset+1);
|
BYTE const offCode = (BYTE)ZSTD_highbit32(offset+1);
|
||||||
|
|
||||||
if (seqStorePtr->staticPrices)
|
if (optPtr->staticPrices)
|
||||||
return ZSTD_getLiteralPrice(seqStorePtr, litLength, literals) + ZSTD_highbit32((U32)matchLength+1) + 16 + offCode;
|
return ZSTD_getLiteralPrice(optPtr, litLength, literals) + ZSTD_highbit32((U32)matchLength+1) + 16 + offCode;
|
||||||
|
|
||||||
price = offCode + seqStorePtr->log2offCodeSum - ZSTD_highbit32(seqStorePtr->offCodeFreq[offCode]+1);
|
price = offCode + optPtr->log2offCodeSum - ZSTD_highbit32(optPtr->offCodeFreq[offCode]+1);
|
||||||
if (!ultra && offCode >= 20) price += (offCode-19)*2;
|
if (!ultra && offCode >= 20) price += (offCode-19)*2;
|
||||||
|
|
||||||
/* match Length */
|
/* match Length */
|
||||||
{ const BYTE ML_deltaCode = 36;
|
{ const BYTE ML_deltaCode = 36;
|
||||||
const BYTE mlCode = (matchLength>127) ? (BYTE)ZSTD_highbit32(matchLength) + ML_deltaCode : ML_Code[matchLength];
|
const BYTE mlCode = (matchLength>127) ? (BYTE)ZSTD_highbit32(matchLength) + ML_deltaCode : ML_Code[matchLength];
|
||||||
price += ML_bits[mlCode] + seqStorePtr->log2matchLengthSum - ZSTD_highbit32(seqStorePtr->matchLengthFreq[mlCode]+1);
|
price += ML_bits[mlCode] + optPtr->log2matchLengthSum - ZSTD_highbit32(optPtr->matchLengthFreq[mlCode]+1);
|
||||||
}
|
}
|
||||||
|
|
||||||
return price + ZSTD_getLiteralPrice(seqStorePtr, litLength, literals) + seqStorePtr->factor;
|
return price + ZSTD_getLiteralPrice(optPtr, litLength, literals) + optPtr->factor;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
MEM_STATIC void ZSTD_updatePrice(seqStore_t* seqStorePtr, U32 litLength, const BYTE* literals, U32 offset, U32 matchLength)
|
MEM_STATIC void ZSTD_updatePrice(optState_t* optPtr, U32 litLength, const BYTE* literals, U32 offset, U32 matchLength)
|
||||||
{
|
{
|
||||||
U32 u;
|
U32 u;
|
||||||
|
|
||||||
/* literals */
|
/* literals */
|
||||||
seqStorePtr->litSum += litLength*ZSTD_LITFREQ_ADD;
|
optPtr->litSum += litLength*ZSTD_LITFREQ_ADD;
|
||||||
for (u=0; u < litLength; u++)
|
for (u=0; u < litLength; u++)
|
||||||
seqStorePtr->litFreq[literals[u]] += ZSTD_LITFREQ_ADD;
|
optPtr->litFreq[literals[u]] += ZSTD_LITFREQ_ADD;
|
||||||
|
|
||||||
/* literal Length */
|
/* literal Length */
|
||||||
{ const BYTE LL_deltaCode = 19;
|
{ const BYTE LL_deltaCode = 19;
|
||||||
const BYTE llCode = (litLength>63) ? (BYTE)ZSTD_highbit32(litLength) + LL_deltaCode : LL_Code[litLength];
|
const BYTE llCode = (litLength>63) ? (BYTE)ZSTD_highbit32(litLength) + LL_deltaCode : LL_Code[litLength];
|
||||||
seqStorePtr->litLengthFreq[llCode]++;
|
optPtr->litLengthFreq[llCode]++;
|
||||||
seqStorePtr->litLengthSum++;
|
optPtr->litLengthSum++;
|
||||||
}
|
}
|
||||||
|
|
||||||
/* match offset */
|
/* match offset */
|
||||||
{ BYTE const offCode = (BYTE)ZSTD_highbit32(offset+1);
|
{ BYTE const offCode = (BYTE)ZSTD_highbit32(offset+1);
|
||||||
seqStorePtr->offCodeSum++;
|
optPtr->offCodeSum++;
|
||||||
seqStorePtr->offCodeFreq[offCode]++;
|
optPtr->offCodeFreq[offCode]++;
|
||||||
}
|
}
|
||||||
|
|
||||||
/* match Length */
|
/* match Length */
|
||||||
{ const BYTE ML_deltaCode = 36;
|
{ const BYTE ML_deltaCode = 36;
|
||||||
const BYTE mlCode = (matchLength>127) ? (BYTE)ZSTD_highbit32(matchLength) + ML_deltaCode : ML_Code[matchLength];
|
const BYTE mlCode = (matchLength>127) ? (BYTE)ZSTD_highbit32(matchLength) + ML_deltaCode : ML_Code[matchLength];
|
||||||
seqStorePtr->matchLengthFreq[mlCode]++;
|
optPtr->matchLengthFreq[mlCode]++;
|
||||||
seqStorePtr->matchLengthSum++;
|
optPtr->matchLengthSum++;
|
||||||
}
|
}
|
||||||
|
|
||||||
ZSTD_setLog2Prices(seqStorePtr);
|
ZSTD_setLog2Prices(optPtr);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
@ -417,6 +417,7 @@ void ZSTD_compressBlock_opt_generic(ZSTD_CCtx* ctx,
|
|||||||
const void* src, size_t srcSize, const int ultra)
|
const void* src, size_t srcSize, const int ultra)
|
||||||
{
|
{
|
||||||
seqStore_t* seqStorePtr = &(ctx->seqStore);
|
seqStore_t* seqStorePtr = &(ctx->seqStore);
|
||||||
|
optState_t* optStatePtr = &(ctx->optState);
|
||||||
const BYTE* const istart = (const BYTE*)src;
|
const BYTE* const istart = (const BYTE*)src;
|
||||||
const BYTE* ip = istart;
|
const BYTE* ip = istart;
|
||||||
const BYTE* anchor = istart;
|
const BYTE* anchor = istart;
|
||||||
@ -430,14 +431,14 @@ void ZSTD_compressBlock_opt_generic(ZSTD_CCtx* ctx,
|
|||||||
const U32 mls = ctx->appliedParams.cParams.searchLength;
|
const U32 mls = ctx->appliedParams.cParams.searchLength;
|
||||||
const U32 minMatch = (ctx->appliedParams.cParams.searchLength == 3) ? 3 : 4;
|
const U32 minMatch = (ctx->appliedParams.cParams.searchLength == 3) ? 3 : 4;
|
||||||
|
|
||||||
ZSTD_optimal_t* opt = seqStorePtr->priceTable;
|
ZSTD_optimal_t* opt = optStatePtr->priceTable;
|
||||||
ZSTD_match_t* matches = seqStorePtr->matchTable;
|
ZSTD_match_t* matches = optStatePtr->matchTable;
|
||||||
const BYTE* inr;
|
const BYTE* inr;
|
||||||
U32 offset, rep[ZSTD_REP_NUM];
|
U32 offset, rep[ZSTD_REP_NUM];
|
||||||
|
|
||||||
/* init */
|
/* init */
|
||||||
ctx->nextToUpdate3 = ctx->nextToUpdate;
|
ctx->nextToUpdate3 = ctx->nextToUpdate;
|
||||||
ZSTD_rescaleFreqs(seqStorePtr, (const BYTE*)src, srcSize);
|
ZSTD_rescaleFreqs(optStatePtr, (const BYTE*)src, srcSize);
|
||||||
ip += (ip==prefixStart);
|
ip += (ip==prefixStart);
|
||||||
{ U32 i; for (i=0; i<ZSTD_REP_NUM; i++) rep[i]=seqStorePtr->rep[i]; }
|
{ U32 i; for (i=0; i<ZSTD_REP_NUM; i++) rep[i]=seqStorePtr->rep[i]; }
|
||||||
|
|
||||||
@ -462,7 +463,7 @@ void ZSTD_compressBlock_opt_generic(ZSTD_CCtx* ctx,
|
|||||||
}
|
}
|
||||||
best_off = i - (ip == anchor);
|
best_off = i - (ip == anchor);
|
||||||
do {
|
do {
|
||||||
price = ZSTD_getPrice(seqStorePtr, litlen, anchor, best_off, mlen - MINMATCH, ultra);
|
price = ZSTD_getPrice(optStatePtr, litlen, anchor, best_off, mlen - MINMATCH, ultra);
|
||||||
if (mlen > last_pos || price < opt[mlen].price)
|
if (mlen > last_pos || price < opt[mlen].price)
|
||||||
SET_PRICE(mlen, mlen, i, litlen, price); /* note : macro modifies last_pos */
|
SET_PRICE(mlen, mlen, i, litlen, price); /* note : macro modifies last_pos */
|
||||||
mlen--;
|
mlen--;
|
||||||
@ -487,7 +488,7 @@ void ZSTD_compressBlock_opt_generic(ZSTD_CCtx* ctx,
|
|||||||
mlen = (u>0) ? matches[u-1].len+1 : best_mlen;
|
mlen = (u>0) ? matches[u-1].len+1 : best_mlen;
|
||||||
best_mlen = matches[u].len;
|
best_mlen = matches[u].len;
|
||||||
while (mlen <= best_mlen) {
|
while (mlen <= best_mlen) {
|
||||||
price = ZSTD_getPrice(seqStorePtr, litlen, anchor, matches[u].off-1, mlen - MINMATCH, ultra);
|
price = ZSTD_getPrice(optStatePtr, litlen, anchor, matches[u].off-1, mlen - MINMATCH, ultra);
|
||||||
if (mlen > last_pos || price < opt[mlen].price)
|
if (mlen > last_pos || price < opt[mlen].price)
|
||||||
SET_PRICE(mlen, mlen, matches[u].off, litlen, price); /* note : macro modifies last_pos */
|
SET_PRICE(mlen, mlen, matches[u].off, litlen, price); /* note : macro modifies last_pos */
|
||||||
mlen++;
|
mlen++;
|
||||||
@ -507,12 +508,12 @@ void ZSTD_compressBlock_opt_generic(ZSTD_CCtx* ctx,
|
|||||||
if (opt[cur-1].mlen == 1) {
|
if (opt[cur-1].mlen == 1) {
|
||||||
litlen = opt[cur-1].litlen + 1;
|
litlen = opt[cur-1].litlen + 1;
|
||||||
if (cur > litlen) {
|
if (cur > litlen) {
|
||||||
price = opt[cur - litlen].price + ZSTD_getLiteralPrice(seqStorePtr, litlen, inr-litlen);
|
price = opt[cur - litlen].price + ZSTD_getLiteralPrice(optStatePtr, litlen, inr-litlen);
|
||||||
} else
|
} else
|
||||||
price = ZSTD_getLiteralPrice(seqStorePtr, litlen, anchor);
|
price = ZSTD_getLiteralPrice(optStatePtr, litlen, anchor);
|
||||||
} else {
|
} else {
|
||||||
litlen = 1;
|
litlen = 1;
|
||||||
price = opt[cur - 1].price + ZSTD_getLiteralPrice(seqStorePtr, litlen, inr-1);
|
price = opt[cur - 1].price + ZSTD_getLiteralPrice(optStatePtr, litlen, inr-1);
|
||||||
}
|
}
|
||||||
|
|
||||||
if (cur > last_pos || price <= opt[cur].price)
|
if (cur > last_pos || price <= opt[cur].price)
|
||||||
@ -554,12 +555,12 @@ void ZSTD_compressBlock_opt_generic(ZSTD_CCtx* ctx,
|
|||||||
if (opt[cur].mlen == 1) {
|
if (opt[cur].mlen == 1) {
|
||||||
litlen = opt[cur].litlen;
|
litlen = opt[cur].litlen;
|
||||||
if (cur > litlen) {
|
if (cur > litlen) {
|
||||||
price = opt[cur - litlen].price + ZSTD_getPrice(seqStorePtr, litlen, inr-litlen, best_off, mlen - MINMATCH, ultra);
|
price = opt[cur - litlen].price + ZSTD_getPrice(optStatePtr, litlen, inr-litlen, best_off, mlen - MINMATCH, ultra);
|
||||||
} else
|
} else
|
||||||
price = ZSTD_getPrice(seqStorePtr, litlen, anchor, best_off, mlen - MINMATCH, ultra);
|
price = ZSTD_getPrice(optStatePtr, litlen, anchor, best_off, mlen - MINMATCH, ultra);
|
||||||
} else {
|
} else {
|
||||||
litlen = 0;
|
litlen = 0;
|
||||||
price = opt[cur].price + ZSTD_getPrice(seqStorePtr, 0, NULL, best_off, mlen - MINMATCH, ultra);
|
price = opt[cur].price + ZSTD_getPrice(optStatePtr, 0, NULL, best_off, mlen - MINMATCH, ultra);
|
||||||
}
|
}
|
||||||
|
|
||||||
if (cur + mlen > last_pos || price <= opt[cur + mlen].price)
|
if (cur + mlen > last_pos || price <= opt[cur + mlen].price)
|
||||||
@ -586,12 +587,12 @@ void ZSTD_compressBlock_opt_generic(ZSTD_CCtx* ctx,
|
|||||||
if (opt[cur].mlen == 1) {
|
if (opt[cur].mlen == 1) {
|
||||||
litlen = opt[cur].litlen;
|
litlen = opt[cur].litlen;
|
||||||
if (cur > litlen)
|
if (cur > litlen)
|
||||||
price = opt[cur - litlen].price + ZSTD_getPrice(seqStorePtr, litlen, ip+cur-litlen, matches[u].off-1, mlen - MINMATCH, ultra);
|
price = opt[cur - litlen].price + ZSTD_getPrice(optStatePtr, litlen, ip+cur-litlen, matches[u].off-1, mlen - MINMATCH, ultra);
|
||||||
else
|
else
|
||||||
price = ZSTD_getPrice(seqStorePtr, litlen, anchor, matches[u].off-1, mlen - MINMATCH, ultra);
|
price = ZSTD_getPrice(optStatePtr, litlen, anchor, matches[u].off-1, mlen - MINMATCH, ultra);
|
||||||
} else {
|
} else {
|
||||||
litlen = 0;
|
litlen = 0;
|
||||||
price = opt[cur].price + ZSTD_getPrice(seqStorePtr, 0, NULL, matches[u].off-1, mlen - MINMATCH, ultra);
|
price = opt[cur].price + ZSTD_getPrice(optStatePtr, 0, NULL, matches[u].off-1, mlen - MINMATCH, ultra);
|
||||||
}
|
}
|
||||||
|
|
||||||
if (cur + mlen > last_pos || (price < opt[cur + mlen].price))
|
if (cur + mlen > last_pos || (price < opt[cur + mlen].price))
|
||||||
@ -645,7 +646,7 @@ _storeSequence: /* cur, last_pos, best_mlen, best_off have to be set */
|
|||||||
if (litLength==0) offset--;
|
if (litLength==0) offset--;
|
||||||
}
|
}
|
||||||
|
|
||||||
ZSTD_updatePrice(seqStorePtr, litLength, anchor, offset, mlen-MINMATCH);
|
ZSTD_updatePrice(optStatePtr, litLength, anchor, offset, mlen-MINMATCH);
|
||||||
ZSTD_storeSeq(seqStorePtr, litLength, anchor, offset, mlen-MINMATCH);
|
ZSTD_storeSeq(seqStorePtr, litLength, anchor, offset, mlen-MINMATCH);
|
||||||
anchor = ip = ip + mlen;
|
anchor = ip = ip + mlen;
|
||||||
} } /* for (cur=0; cur < last_pos; ) */
|
} } /* for (cur=0; cur < last_pos; ) */
|
||||||
@ -666,6 +667,7 @@ void ZSTD_compressBlock_opt_extDict_generic(ZSTD_CCtx* ctx,
|
|||||||
const void* src, size_t srcSize, const int ultra)
|
const void* src, size_t srcSize, const int ultra)
|
||||||
{
|
{
|
||||||
seqStore_t* seqStorePtr = &(ctx->seqStore);
|
seqStore_t* seqStorePtr = &(ctx->seqStore);
|
||||||
|
optState_t* optStatePtr = &(ctx->optState);
|
||||||
const BYTE* const istart = (const BYTE*)src;
|
const BYTE* const istart = (const BYTE*)src;
|
||||||
const BYTE* ip = istart;
|
const BYTE* ip = istart;
|
||||||
const BYTE* anchor = istart;
|
const BYTE* anchor = istart;
|
||||||
@ -683,8 +685,8 @@ void ZSTD_compressBlock_opt_extDict_generic(ZSTD_CCtx* ctx,
|
|||||||
const U32 mls = ctx->appliedParams.cParams.searchLength;
|
const U32 mls = ctx->appliedParams.cParams.searchLength;
|
||||||
const U32 minMatch = (ctx->appliedParams.cParams.searchLength == 3) ? 3 : 4;
|
const U32 minMatch = (ctx->appliedParams.cParams.searchLength == 3) ? 3 : 4;
|
||||||
|
|
||||||
ZSTD_optimal_t* opt = seqStorePtr->priceTable;
|
ZSTD_optimal_t* opt = optStatePtr->priceTable;
|
||||||
ZSTD_match_t* matches = seqStorePtr->matchTable;
|
ZSTD_match_t* matches = optStatePtr->matchTable;
|
||||||
const BYTE* inr;
|
const BYTE* inr;
|
||||||
|
|
||||||
/* init */
|
/* init */
|
||||||
@ -692,7 +694,7 @@ void ZSTD_compressBlock_opt_extDict_generic(ZSTD_CCtx* ctx,
|
|||||||
{ U32 i; for (i=0; i<ZSTD_REP_NUM; i++) rep[i]=seqStorePtr->rep[i]; }
|
{ U32 i; for (i=0; i<ZSTD_REP_NUM; i++) rep[i]=seqStorePtr->rep[i]; }
|
||||||
|
|
||||||
ctx->nextToUpdate3 = ctx->nextToUpdate;
|
ctx->nextToUpdate3 = ctx->nextToUpdate;
|
||||||
ZSTD_rescaleFreqs(seqStorePtr, (const BYTE*)src, srcSize);
|
ZSTD_rescaleFreqs(optStatePtr, (const BYTE*)src, srcSize);
|
||||||
ip += (ip==prefixStart);
|
ip += (ip==prefixStart);
|
||||||
|
|
||||||
/* Match Loop */
|
/* Match Loop */
|
||||||
@ -726,7 +728,7 @@ void ZSTD_compressBlock_opt_extDict_generic(ZSTD_CCtx* ctx,
|
|||||||
best_off = i - (ip==anchor);
|
best_off = i - (ip==anchor);
|
||||||
litlen = opt[0].litlen;
|
litlen = opt[0].litlen;
|
||||||
do {
|
do {
|
||||||
price = ZSTD_getPrice(seqStorePtr, litlen, anchor, best_off, mlen - MINMATCH, ultra);
|
price = ZSTD_getPrice(optStatePtr, litlen, anchor, best_off, mlen - MINMATCH, ultra);
|
||||||
if (mlen > last_pos || price < opt[mlen].price)
|
if (mlen > last_pos || price < opt[mlen].price)
|
||||||
SET_PRICE(mlen, mlen, i, litlen, price); /* note : macro modifies last_pos */
|
SET_PRICE(mlen, mlen, i, litlen, price); /* note : macro modifies last_pos */
|
||||||
mlen--;
|
mlen--;
|
||||||
@ -756,7 +758,7 @@ void ZSTD_compressBlock_opt_extDict_generic(ZSTD_CCtx* ctx,
|
|||||||
best_mlen = matches[u].len;
|
best_mlen = matches[u].len;
|
||||||
litlen = opt[0].litlen;
|
litlen = opt[0].litlen;
|
||||||
while (mlen <= best_mlen) {
|
while (mlen <= best_mlen) {
|
||||||
price = ZSTD_getPrice(seqStorePtr, litlen, anchor, matches[u].off-1, mlen - MINMATCH, ultra);
|
price = ZSTD_getPrice(optStatePtr, litlen, anchor, matches[u].off-1, mlen - MINMATCH, ultra);
|
||||||
if (mlen > last_pos || price < opt[mlen].price)
|
if (mlen > last_pos || price < opt[mlen].price)
|
||||||
SET_PRICE(mlen, mlen, matches[u].off, litlen, price);
|
SET_PRICE(mlen, mlen, matches[u].off, litlen, price);
|
||||||
mlen++;
|
mlen++;
|
||||||
@ -773,12 +775,12 @@ void ZSTD_compressBlock_opt_extDict_generic(ZSTD_CCtx* ctx,
|
|||||||
if (opt[cur-1].mlen == 1) {
|
if (opt[cur-1].mlen == 1) {
|
||||||
litlen = opt[cur-1].litlen + 1;
|
litlen = opt[cur-1].litlen + 1;
|
||||||
if (cur > litlen) {
|
if (cur > litlen) {
|
||||||
price = opt[cur - litlen].price + ZSTD_getLiteralPrice(seqStorePtr, litlen, inr-litlen);
|
price = opt[cur - litlen].price + ZSTD_getLiteralPrice(optStatePtr, litlen, inr-litlen);
|
||||||
} else
|
} else
|
||||||
price = ZSTD_getLiteralPrice(seqStorePtr, litlen, anchor);
|
price = ZSTD_getLiteralPrice(optStatePtr, litlen, anchor);
|
||||||
} else {
|
} else {
|
||||||
litlen = 1;
|
litlen = 1;
|
||||||
price = opt[cur - 1].price + ZSTD_getLiteralPrice(seqStorePtr, litlen, inr-1);
|
price = opt[cur - 1].price + ZSTD_getLiteralPrice(optStatePtr, litlen, inr-1);
|
||||||
}
|
}
|
||||||
|
|
||||||
if (cur > last_pos || price <= opt[cur].price)
|
if (cur > last_pos || price <= opt[cur].price)
|
||||||
@ -826,12 +828,12 @@ void ZSTD_compressBlock_opt_extDict_generic(ZSTD_CCtx* ctx,
|
|||||||
if (opt[cur].mlen == 1) {
|
if (opt[cur].mlen == 1) {
|
||||||
litlen = opt[cur].litlen;
|
litlen = opt[cur].litlen;
|
||||||
if (cur > litlen) {
|
if (cur > litlen) {
|
||||||
price = opt[cur - litlen].price + ZSTD_getPrice(seqStorePtr, litlen, inr-litlen, best_off, mlen - MINMATCH, ultra);
|
price = opt[cur - litlen].price + ZSTD_getPrice(optStatePtr, litlen, inr-litlen, best_off, mlen - MINMATCH, ultra);
|
||||||
} else
|
} else
|
||||||
price = ZSTD_getPrice(seqStorePtr, litlen, anchor, best_off, mlen - MINMATCH, ultra);
|
price = ZSTD_getPrice(optStatePtr, litlen, anchor, best_off, mlen - MINMATCH, ultra);
|
||||||
} else {
|
} else {
|
||||||
litlen = 0;
|
litlen = 0;
|
||||||
price = opt[cur].price + ZSTD_getPrice(seqStorePtr, 0, NULL, best_off, mlen - MINMATCH, ultra);
|
price = opt[cur].price + ZSTD_getPrice(optStatePtr, 0, NULL, best_off, mlen - MINMATCH, ultra);
|
||||||
}
|
}
|
||||||
|
|
||||||
if (cur + mlen > last_pos || price <= opt[cur + mlen].price)
|
if (cur + mlen > last_pos || price <= opt[cur + mlen].price)
|
||||||
@ -858,12 +860,12 @@ void ZSTD_compressBlock_opt_extDict_generic(ZSTD_CCtx* ctx,
|
|||||||
if (opt[cur].mlen == 1) {
|
if (opt[cur].mlen == 1) {
|
||||||
litlen = opt[cur].litlen;
|
litlen = opt[cur].litlen;
|
||||||
if (cur > litlen)
|
if (cur > litlen)
|
||||||
price = opt[cur - litlen].price + ZSTD_getPrice(seqStorePtr, litlen, ip+cur-litlen, matches[u].off-1, mlen - MINMATCH, ultra);
|
price = opt[cur - litlen].price + ZSTD_getPrice(optStatePtr, litlen, ip+cur-litlen, matches[u].off-1, mlen - MINMATCH, ultra);
|
||||||
else
|
else
|
||||||
price = ZSTD_getPrice(seqStorePtr, litlen, anchor, matches[u].off-1, mlen - MINMATCH, ultra);
|
price = ZSTD_getPrice(optStatePtr, litlen, anchor, matches[u].off-1, mlen - MINMATCH, ultra);
|
||||||
} else {
|
} else {
|
||||||
litlen = 0;
|
litlen = 0;
|
||||||
price = opt[cur].price + ZSTD_getPrice(seqStorePtr, 0, NULL, matches[u].off-1, mlen - MINMATCH, ultra);
|
price = opt[cur].price + ZSTD_getPrice(optStatePtr, 0, NULL, matches[u].off-1, mlen - MINMATCH, ultra);
|
||||||
}
|
}
|
||||||
|
|
||||||
if (cur + mlen > last_pos || (price < opt[cur + mlen].price))
|
if (cur + mlen > last_pos || (price < opt[cur + mlen].price))
|
||||||
@ -918,7 +920,7 @@ _storeSequence: /* cur, last_pos, best_mlen, best_off have to be set */
|
|||||||
if (litLength==0) offset--;
|
if (litLength==0) offset--;
|
||||||
}
|
}
|
||||||
|
|
||||||
ZSTD_updatePrice(seqStorePtr, litLength, anchor, offset, mlen-MINMATCH);
|
ZSTD_updatePrice(optStatePtr, litLength, anchor, offset, mlen-MINMATCH);
|
||||||
ZSTD_storeSeq(seqStorePtr, litLength, anchor, offset, mlen-MINMATCH);
|
ZSTD_storeSeq(seqStorePtr, litLength, anchor, offset, mlen-MINMATCH);
|
||||||
anchor = ip = ip + mlen;
|
anchor = ip = ip + mlen;
|
||||||
} } /* for (cur=0; cur < last_pos; ) */
|
} } /* for (cur=0; cur < last_pos; ) */
|
||||||
|
Loading…
Reference in New Issue
Block a user