removes matches[] table

saves stack space
clearer match finder interface (no more table to fill)
This commit is contained in:
Yann Collet 2017-11-03 01:37:43 -07:00
parent 320e1d51ac
commit 3b222d2d96

View File

@ -88,18 +88,18 @@ int LZ4HC_FindLongerMatch(LZ4HC_CCtx_internal* const ctx, /* Index table will
return LZ4HC_InsertAndGetWiderMatch(ctx, ip, ip, iHighLimit, longest, matchpos, &uselessPtr, maxNbAttempts); return LZ4HC_InsertAndGetWiderMatch(ctx, ip, ip, iHighLimit, longest, matchpos, &uselessPtr, maxNbAttempts);
} }
LZ4_FORCE_INLINE int LZ4HC_HashChain_GetAllMatches ( LZ4_FORCE_INLINE
LZ4HC_CCtx_internal* ctx, LZ4HC_match_t LZ4HC_HashChain_GetAllMatches (LZ4HC_CCtx_internal* const ctx,
const BYTE* const ip, const BYTE* const iHighLimit, const BYTE* const ip, const BYTE* const iHighLimit,
size_t best_mlen, LZ4HC_match_t* matches) size_t best_mlen)
{ {
LZ4HC_match_t match = {0 , 0};
const BYTE* matchPtr = NULL; const BYTE* matchPtr = NULL;
int matchLength = LZ4HC_FindLongerMatch(ctx, ip, iHighLimit, (int)best_mlen, &matchPtr, ctx->searchNum); int matchLength = LZ4HC_FindLongerMatch(ctx, ip, iHighLimit, (int)best_mlen, &matchPtr, ctx->searchNum);
if ((size_t)matchLength <= best_mlen) return 0; if ((size_t)matchLength <= best_mlen) return match;
assert(matches != NULL); match.len = matchLength;
matches[0].len = matchLength; match.off = (int)(ip-matchPtr);
matches[0].off = (int)(ip-matchPtr); return match;
return 1;
} }
@ -115,7 +115,6 @@ static int LZ4HC_compress_optimal (
) )
{ {
LZ4HC_optimal_t opt[LZ4_OPT_NUM + 3]; /* this uses a bit too much stack memory to my taste ... */ LZ4HC_optimal_t opt[LZ4_OPT_NUM + 3]; /* this uses a bit too much stack memory to my taste ... */
LZ4HC_match_t matches[LZ4_OPT_NUM + 1];
const BYTE* ip = (const BYTE*) source; const BYTE* ip = (const BYTE*) source;
const BYTE* anchor = ip; const BYTE* anchor = ip;
@ -138,13 +137,13 @@ static int LZ4HC_compress_optimal (
int best_mlen, best_off; int best_mlen, best_off;
int cur, last_match_pos = 0; int cur, last_match_pos = 0;
int const nb_matches_initial = LZ4HC_HashChain_GetAllMatches(ctx, ip, matchlimit, MINMATCH-1, matches); LZ4HC_match_t const firstMatch = LZ4HC_HashChain_GetAllMatches(ctx, ip, matchlimit, MINMATCH-1);
if (!nb_matches_initial) { ip++; continue; } if (firstMatch.len==0) { ip++; continue; }
if ((size_t)matches[nb_matches_initial-1].len > sufficient_len) { if ((size_t)firstMatch.len > sufficient_len) {
/* good enough solution : immediate encoding */ /* good enough solution : immediate encoding */
int const firstML = matches[nb_matches_initial-1].len; int const firstML = firstMatch.len;
const BYTE* const matchPos = ip - matches[nb_matches_initial-1].off; const BYTE* const matchPos = ip - firstMatch.off;
if ( LZ4HC_encodeSequence(&ip, &op, &anchor, firstML, matchPos, limit, oend) ) /* updates ip, op and anchor */ if ( LZ4HC_encodeSequence(&ip, &op, &anchor, firstML, matchPos, limit, oend) ) /* updates ip, op and anchor */
return 0; /* error */ return 0; /* error */
continue; continue;
@ -162,11 +161,9 @@ static int LZ4HC_compress_optimal (
rPos, cost, opt[rPos].litlen); rPos, cost, opt[rPos].litlen);
} } } }
/* set prices using matches found for rPos = 0 */ /* set prices using matches found for rPos = 0 */
{ int matchNb; { int mlen = MINMATCH;
for (matchNb = 0; matchNb < nb_matches_initial; matchNb++) { int const matchML = firstMatch.len; /* necessarily < sufficient_len < LZ4_OPT_NUM */
int mlen = (matchNb>0) ? matches[matchNb-1].len+1 : MINMATCH; int const offset = firstMatch.off;
int const matchML = matches[matchNb].len; /* necessarily < sufficient_len < LZ4_OPT_NUM */
int const offset = matches[matchNb].off;
assert(matchML < LZ4_OPT_NUM); assert(matchML < LZ4_OPT_NUM);
for ( ; mlen <= matchML ; mlen++) { for ( ; mlen <= matchML ; mlen++) {
int const cost = LZ4HC_sequencePrice(llen, mlen); int const cost = LZ4HC_sequencePrice(llen, mlen);
@ -176,8 +173,8 @@ static int LZ4HC_compress_optimal (
opt[mlen].price = cost; opt[mlen].price = cost;
DEBUGLOG(7, "rPos:%3i => price:%3i (matchlen=%i) -- initial setup", DEBUGLOG(7, "rPos:%3i => price:%3i (matchlen=%i) -- initial setup",
mlen, cost, mlen); mlen, cost, mlen);
} } } } }
last_match_pos = matches[nb_matches_initial-1].len; last_match_pos = firstMatch.len;
{ int addLit; { int addLit;
for (addLit = 1; addLit <= 3; addLit ++) { for (addLit = 1; addLit <= 3; addLit ++) {
opt[last_match_pos+addLit].mlen = 1; /* literal */ opt[last_match_pos+addLit].mlen = 1; /* literal */
@ -191,7 +188,7 @@ static int LZ4HC_compress_optimal (
/* check further positions */ /* check further positions */
for (cur = 1; cur < last_match_pos; cur++) { for (cur = 1; cur < last_match_pos; cur++) {
const BYTE* const curPtr = ip + cur; const BYTE* const curPtr = ip + cur;
int nb_matches; LZ4HC_match_t newMatch;
if (curPtr >= mflimit) break; if (curPtr >= mflimit) break;
DEBUGLOG(7, "rPos:%u[%u] vs [%u]%u", DEBUGLOG(7, "rPos:%u[%u] vs [%u]%u",
@ -204,16 +201,16 @@ static int LZ4HC_compress_optimal (
DEBUGLOG(7, "search at rPos:%u", cur); DEBUGLOG(7, "search at rPos:%u", cur);
if (fullUpdate) if (fullUpdate)
nb_matches = LZ4HC_HashChain_GetAllMatches(ctx, curPtr, matchlimit, MINMATCH-1, matches); newMatch = LZ4HC_HashChain_GetAllMatches(ctx, curPtr, matchlimit, MINMATCH-1);
else else
nb_matches = LZ4HC_HashChain_GetAllMatches(ctx, curPtr, matchlimit, last_match_pos - cur, matches); /* only test matches of a minimum length; slightly faster, but misses a few bytes */ newMatch = LZ4HC_HashChain_GetAllMatches(ctx, curPtr, matchlimit, last_match_pos - cur); /* only test matches of a minimum length; slightly faster, but misses a few bytes */
if (!nb_matches) continue; if (!newMatch.len) continue;
if ( ((size_t)matches[nb_matches-1].len > sufficient_len) if ( ((size_t)newMatch.len > sufficient_len)
|| (matches[nb_matches-1].len + cur >= LZ4_OPT_NUM) ) { || (newMatch.len + cur >= LZ4_OPT_NUM) ) {
/* immediate encoding */ /* immediate encoding */
best_mlen = matches[nb_matches-1].len; best_mlen = newMatch.len;
best_off = matches[nb_matches-1].off; best_off = newMatch.off;
last_match_pos = cur + 1; last_match_pos = cur + 1;
goto encode; goto encode;
} }
@ -234,15 +231,13 @@ static int LZ4HC_compress_optimal (
} } } } } }
/* set prices using matches at position = cur */ /* set prices using matches at position = cur */
{ int matchNb; { int const matchML = newMatch.len;
assert(cur + matches[nb_matches-1].len < LZ4_OPT_NUM); int ml = MINMATCH;
for (matchNb = 0; matchNb < nb_matches; matchNb++) {
int const matchML = matches[matchNb].len;
int ml = (matchNb>0) ? matches[matchNb-1].len+1 : MINMATCH;
assert(cur + newMatch.len < LZ4_OPT_NUM);
for ( ; ml <= matchML ; ml++) { for ( ; ml <= matchML ; ml++) {
int const pos = cur + ml; int const pos = cur + ml;
int const offset = matches[matchNb].off; int const offset = newMatch.off;
int price; int price;
int ll; int ll;
DEBUGLOG(7, "testing price rPos %i (last_match_pos=%i)", DEBUGLOG(7, "testing price rPos %i (last_match_pos=%i)",
@ -260,15 +255,14 @@ static int LZ4HC_compress_optimal (
DEBUGLOG(7, "rPos:%3i => price:%3i (matchlen=%i)", DEBUGLOG(7, "rPos:%3i => price:%3i (matchlen=%i)",
pos, price, ml); pos, price, ml);
assert(pos < LZ4_OPT_NUM); assert(pos < LZ4_OPT_NUM);
if ( (matchNb == nb_matches-1) /* last match */ if ( (ml == matchML) /* last post of last match */
&& (ml == matchML) /* last post of last match */
&& (last_match_pos < pos) ) && (last_match_pos < pos) )
last_match_pos = pos; last_match_pos = pos;
opt[pos].mlen = ml; opt[pos].mlen = ml;
opt[pos].off = offset; opt[pos].off = offset;
opt[pos].litlen = ll; opt[pos].litlen = ll;
opt[pos].price = price; opt[pos].price = price;
} } } } } } }
/* complete following positions with literals */ /* complete following positions with literals */
{ int addLit; { int addLit;
for (addLit = 1; addLit <= 3; addLit ++) { for (addLit = 1; addLit <= 3; addLit ++) {