From 90fa770458606bf098d8bc1e5d1e6a9aa72b4337 Mon Sep 17 00:00:00 2001 From: Emmanuel Marty Date: Mon, 27 Jul 2020 13:25:16 +0200 Subject: [PATCH] Compress another 8% faster --- src/shrink_block_v2.c | 8 +++++++- src/shrink_context.h | 1 + 2 files changed, 8 insertions(+), 1 deletion(-) diff --git a/src/shrink_block_v2.c b/src/shrink_block_v2.c index bbb746e..7743d37 100644 --- a/src/shrink_block_v2.c +++ b/src/shrink_block_v2.c @@ -271,9 +271,11 @@ static void lzsa_insert_forward_match_v2(lzsa_compressor *pCompressor, const uns static void lzsa_optimize_forward_v2(lzsa_compressor *pCompressor, const unsigned char *pInWindow, lzsa_match *pBestMatch, const int nStartOffset, const int nEndOffset, const int nReduce, const int nInsertForwardReps, const int nArrivalsPerPosition) { lzsa_arrival *arrival = pCompressor->arrival - (nStartOffset << ARRIVALS_PER_POSITION_SHIFT); const int* rle_end = (int*)pCompressor->intervals /* reuse */; + char* rep_inserted = pCompressor->rep_inserted; const int nModeSwitchPenalty = (pCompressor->flags & LZSA_FLAG_FAVOR_RATIO) ? 0 : MODESWITCH_PENALTY; const int nMinMatchSize = pCompressor->min_match_size; const int nDisableScore = nReduce ? 0 : (2 * BLOCK_SIZE); + const int nMaxRepInsertedLen = nReduce ? 64 : 0; const int nLeaveAloneMatchSize = (nArrivalsPerPosition == NARRIVALS_PER_POSITION_V2_SMALL) ? LEAVE_ALONE_MATCH_SIZE_SMALL : LEAVE_ALONE_MATCH_SIZE; int i, j, n; @@ -382,6 +384,7 @@ static void lzsa_optimize_forward_v2(lzsa_compressor *pCompressor, const unsigne int nMinRepLen[NARRIVALS_PER_POSITION_V2_BIG]; memset(nMinRepLen, 0, nArrivalsPerPosition * sizeof(int)); + memset(rep_inserted, 0, NARRIVALS_PER_POSITION_V2_BIG * (64 / 8) * sizeof(char)); for (j = 0; j < nNumArrivalsForThisPos; j++) { int nRepOffset = cur_arrival[j].rep_offset; @@ -548,7 +551,7 @@ static void lzsa_optimize_forward_v2(lzsa_compressor *pCompressor, const unsigne if (k <= nMaxOverallRepLen) { for (j = 0; j < nNumArrivalsForThisPos; j++) { - if (nMinRepLen[j] >= k) { + if (nMinRepLen[j] >= k && (k >= 64 || (rep_inserted[(j << 3) + (k >> 3)] & (1 << (k & 7))) == 0)) { const int nPrevCost = cur_arrival[j].cost & 0x3fffffff; int nRepCodingChoiceCost = nPrevCost /* the actual cost of the literals themselves accumulates up the chain */ + nMatchLenCost; int nScore = cur_arrival[j].score + 2; @@ -616,6 +619,9 @@ static void lzsa_optimize_forward_v2(lzsa_compressor *pCompressor, const unsigne } } } + + if (k < nMaxRepInsertedLen) + rep_inserted[(j << 3) + (k >> 3)] |= (1 << (k & 7)); } else { break; diff --git a/src/shrink_context.h b/src/shrink_context.h index b1dcbd7..62fe4a0 100644 --- a/src/shrink_context.h +++ b/src/shrink_context.h @@ -129,6 +129,7 @@ typedef struct _lzsa_compressor { int flags; int safe_dist; int num_commands; + char rep_inserted[NARRIVALS_PER_POSITION_V2_BIG * (64 / 8)]; lzsa_stats stats; } lzsa_compressor;