Files
easy7zip/C/fast-lzma2/lzma2_enc.c
2018-11-05 21:22:10 +10:00

2048 lines
78 KiB
C

/* lzma2_enc.c -- LZMA2 Encoder
Based on LzmaEnc.c and Lzma2Enc.c : Igor Pavlov
Modified for FL2 by Conor McCarthy
Public domain
*/
#include <stdlib.h>
#include <math.h>
#include "fl2_internal.h"
#include "mem.h"
#include "lzma2_enc.h"
#include "fl2_compress_internal.h"
#include "radix_mf.h"
#include "range_enc.h"
#include "count.h"
#define kNumReps 4U
#define kNumStates 12U
#define kNumLiterals 0x100U
#define kNumLitTables 3U
#define kNumLenToPosStates 4U
#define kNumPosSlotBits 6U
#define kDicLogSizeMin 18U
#define kDicLogSizeMax 31U
#define kDistTableSizeMax (kDicLogSizeMax * 2U)
#define kNumAlignBits 4U
#define kAlignTableSize (1U << kNumAlignBits)
#define kAlignMask (kAlignTableSize - 1U)
#define kAlignRepriceFrequency kAlignTableSize
#define kStartPosModelIndex 4U
#define kEndPosModelIndex 14U
#define kNumPosModels (kEndPosModelIndex - kStartPosModelIndex)
#define kNumFullDistancesBits (kEndPosModelIndex >> 1U)
#define kNumFullDistances (1U << kNumFullDistancesBits)
#define kDistanceRepriceFrequency (1U << 7U)
#define kNumPositionBitsMax 4U
#define kNumPositionStatesMax (1U << kNumPositionBitsMax)
#define kNumLiteralContextBitsMax 4U
#define kNumLiteralPosBitsMax 4U
#define kLcLpMax 4U
#define kLenNumLowBits 3U
#define kLenNumLowSymbols (1U << kLenNumLowBits)
#define kLenNumMidBits 3U
#define kLenNumMidSymbols (1U << kLenNumMidBits)
#define kLenNumHighBits 8U
#define kLenNumHighSymbols (1U << kLenNumHighBits)
#define kLenNumSymbolsTotal (kLenNumLowSymbols + kLenNumMidSymbols + kLenNumHighSymbols)
#define kMatchLenMin 2U
#define kMatchLenMax (kMatchLenMin + kLenNumSymbolsTotal - 1U)
#define kOptimizerBufferSize (1U << 12U)
#define kInfinityPrice (1UL << 30U)
#define kNullDist (U32)-1
#define kChunkSize ((1UL << 16U) - 8192U)
#define kChunkBufferSize (1UL << 16U)
#define kMaxChunkUncompressedSize ((1UL << 21U) - kMatchLenMax)
#define kChunkHeaderSize 5U
#define kChunkResetShift 5U
#define kChunkUncompressedDictReset 1U
#define kChunkUncompressed 2U
#define kChunkCompressedFlag 0x80U
#define kChunkNothingReset 0U
#define kChunkStateReset (1U << kChunkResetShift)
#define kChunkStatePropertiesReset (2U << kChunkResetShift)
#define kChunkAllReset (3U << kChunkResetShift)
#define kMaxHashDictBits 14U
#define kHash3Bits 14U
#define kNullLink -1
#define kMinTestChunkSize 0x4000U
#define kRandomFilterMarginBits 8U
static const BYTE kLiteralNextStates[kNumStates] = { 0, 0, 0, 0, 1, 2, 3, 4, 5, 6, 4, 5 };
#define LiteralNextState(s) kLiteralNextStates[s]
static const BYTE kMatchNextStates[kNumStates] = { 7, 7, 7, 7, 7, 7, 7, 10, 10, 10, 10, 10 };
#define MatchNextState(s) kMatchNextStates[s]
static const BYTE kRepNextStates[kNumStates] = { 8, 8, 8, 8, 8, 8, 8, 11, 11, 11, 11, 11 };
#define RepNextState(s) kRepNextStates[s]
static const BYTE kShortRepNextStates[kNumStates] = { 9, 9, 9, 9, 9, 9, 9, 11, 11, 11, 11, 11 };
#define ShortRepNextState(s) kShortRepNextStates[s]
#include "fastpos_table.h"
typedef struct
{
size_t table_size;
unsigned prices[kNumPositionStatesMax][kLenNumSymbolsTotal];
unsigned counters[kNumPositionStatesMax];
Probability choice;
Probability choice_2;
Probability low[kNumPositionStatesMax << kLenNumLowBits];
Probability mid[kNumPositionStatesMax << kLenNumMidBits];
Probability high[kLenNumHighSymbols];
} LengthStates;
typedef struct
{
U32 reps[kNumReps];
size_t state;
Probability is_rep[kNumStates];
Probability is_rep_G0[kNumStates];
Probability is_rep_G1[kNumStates];
Probability is_rep_G2[kNumStates];
Probability is_rep0_long[kNumStates][kNumPositionStatesMax];
Probability is_match[kNumStates][kNumPositionStatesMax];
Probability dist_slot_encoders[kNumLenToPosStates][1 << kNumPosSlotBits];
Probability dist_align_encoders[1 << kNumAlignBits];
Probability dist_encoders[kNumFullDistances - kEndPosModelIndex];
LengthStates len_states;
LengthStates rep_len_states;
Probability literal_probs[(kNumLiterals * kNumLitTables) << kLcLpMax];
} EncoderStates;
typedef struct
{
size_t state;
U32 reps[kNumReps];
U32 price;
unsigned prev_index;
U32 prev_dist;
unsigned prev_index_2;
U32 prev_dist_2;
BYTE is_combination;
BYTE prev_2;
} OptimalNode;
#define MakeAsLiteral(node) (node).prev_dist = kNullDist; (node).is_combination = 0;
#define MakeAsShortRep(node) (node).prev_dist = 0; (node).is_combination = 0;
typedef struct {
S32 table_3[1 << kHash3Bits];
S32 hash_chain_3[1];
} HashChains;
typedef struct
{
U32 length;
U32 dist;
} Match;
struct FL2_lzmaEncoderCtx_s
{
unsigned lc;
unsigned lp;
unsigned pb;
unsigned fast_length;
size_t len_end_max;
size_t lit_pos_mask;
size_t pos_mask;
unsigned match_cycles;
FL2_strategy strategy;
RangeEncoder rc;
EncoderStates states;
unsigned match_price_count;
unsigned align_price_count;
size_t dist_price_table_size;
unsigned align_prices[kAlignTableSize];
unsigned dist_slot_prices[kNumLenToPosStates][kDistTableSizeMax];
unsigned distance_prices[kNumLenToPosStates][kNumFullDistances];
Match matches[kMatchLenMax-kMatchLenMin];
size_t match_count;
OptimalNode opt_buf[kOptimizerBufferSize];
BYTE* out_buf;
HashChains* hash_buf;
ptrdiff_t chain_mask_2;
ptrdiff_t chain_mask_3;
ptrdiff_t hash_dict_3;
ptrdiff_t hash_prev_index;
ptrdiff_t hash_alloc_3;
};
FL2_lzmaEncoderCtx* FL2_lzma2Create()
{
FL2_lzmaEncoderCtx* enc = malloc(sizeof(FL2_lzmaEncoderCtx));
DEBUGLOG(3, "FL2_lzma2Create");
if (enc == NULL)
return NULL;
enc->out_buf = malloc(kChunkBufferSize);
if (enc->out_buf == NULL) {
free(enc);
return NULL;
}
enc->lc = 3;
enc->lp = 0;
enc->pb = 2;
enc->fast_length = 48;
enc->len_end_max = kOptimizerBufferSize - 1;
enc->lit_pos_mask = (1 << enc->lp) - 1;
enc->pos_mask = (1 << enc->pb) - 1;
enc->match_cycles = 1;
enc->strategy = FL2_ultra;
enc->match_price_count = kDistanceRepriceFrequency;
enc->align_price_count = kAlignRepriceFrequency;
enc->dist_price_table_size = kDistTableSizeMax;
enc->hash_buf = NULL;
enc->hash_dict_3 = 0;
enc->chain_mask_3 = 0;
enc->hash_alloc_3 = 0;
return enc;
}
void FL2_lzma2Free(FL2_lzmaEncoderCtx* enc)
{
if (enc == NULL)
return;
free(enc->hash_buf);
free(enc->out_buf);
free(enc);
}
#define GetLiteralProbs(enc, pos, prev_symbol) (enc->states.literal_probs + ((((pos) & enc->lit_pos_mask) << enc->lc) + ((prev_symbol) >> (8 - enc->lc))) * kNumLiterals * kNumLitTables)
#define GetLenToDistState(len) (((len) < kNumLenToPosStates + 1) ? (len) - 2 : kNumLenToPosStates - 1)
#define IsCharState(state) ((state) < 7)
HINT_INLINE
unsigned GetRepLen1Price(FL2_lzmaEncoderCtx* enc, size_t state, size_t pos_state)
{
unsigned rep_G0_prob = enc->states.is_rep_G0[state];
unsigned rep0_long_prob = enc->states.is_rep0_long[state][pos_state];
return GET_PRICE_0(enc->rc, rep_G0_prob) + GET_PRICE_0(enc->rc, rep0_long_prob);
}
static unsigned GetRepPrice(FL2_lzmaEncoderCtx* enc, size_t rep_index, size_t state, size_t pos_state)
{
unsigned price;
unsigned rep_G0_prob = enc->states.is_rep_G0[state];
if (rep_index == 0) {
unsigned rep0_long_prob = enc->states.is_rep0_long[state][pos_state];
price = GET_PRICE_0(enc->rc, rep_G0_prob);
price += GET_PRICE_1(enc->rc, rep0_long_prob);
}
else {
unsigned rep_G1_prob = enc->states.is_rep_G1[state];
price = GET_PRICE_1(enc->rc, rep_G0_prob);
if (rep_index == 1) {
price += GET_PRICE_0(enc->rc, rep_G1_prob);
}
else {
unsigned rep_G2_prob = enc->states.is_rep_G2[state];
price += GET_PRICE_1(enc->rc, rep_G1_prob);
price += GET_PRICE(enc->enc->rc, rep_G2_prob, (U32)(rep_index) - 2);
}
}
return price;
}
static unsigned GetRepMatch0Price(FL2_lzmaEncoderCtx* enc, size_t len, size_t state, size_t pos_state)
{
unsigned rep_G0_prob = enc->states.is_rep_G0[state];
unsigned rep0_long_prob = enc->states.is_rep0_long[state][pos_state];
return enc->states.rep_len_states.prices[pos_state][len - kMatchLenMin]
+ GET_PRICE_0(enc->rc, rep_G0_prob)
+ GET_PRICE_1(enc->rc, rep0_long_prob);
}
static unsigned GetLiteralPriceMatched(RangeEncoder* rc, const Probability *prob_table, U32 symbol, unsigned match_byte)
{
unsigned price = 0;
unsigned offs = 0x100;
symbol |= 0x100;
do {
match_byte <<= 1;
price += GET_PRICE(enc->rc, prob_table[offs + (match_byte & offs) + (symbol >> 8)], (symbol >> 7) & 1);
symbol <<= 1;
offs &= ~(match_byte ^ symbol);
} while (symbol < 0x10000);
return price;
}
static void EncodeLiteral(FL2_lzmaEncoderCtx* enc, size_t index, U32 symbol, unsigned prev_symbol)
{
EncodeBit0(&enc->rc, &enc->states.is_match[enc->states.state][index & enc->pos_mask]);
enc->states.state = LiteralNextState(enc->states.state);
{ Probability* prob_table = GetLiteralProbs(enc, index, prev_symbol);
symbol |= 0x100;
do {
EncodeBit(&enc->rc, prob_table + (symbol >> 8), symbol & (1 << 7));
symbol <<= 1;
} while (symbol < 0x10000);
}
}
static void EncodeLiteralMatched(FL2_lzmaEncoderCtx* enc, const BYTE* data_block, size_t index, U32 symbol)
{
EncodeBit0(&enc->rc, &enc->states.is_match[enc->states.state][index & enc->pos_mask]);
enc->states.state = LiteralNextState(enc->states.state);
{ unsigned match_symbol = data_block[index - enc->states.reps[0] - 1];
Probability* prob_table = GetLiteralProbs(enc, index, data_block[index - 1]);
unsigned offset = 0x100;
symbol |= 0x100;
do {
match_symbol <<= 1;
size_t prob_index = offset + (match_symbol & offset) + (symbol >> 8);
EncodeBit(&enc->rc, prob_table + prob_index, symbol & (1 << 7));
symbol <<= 1;
offset &= ~(match_symbol ^ symbol);
} while (symbol < 0x10000);
}
}
HINT_INLINE
void EncodeLiteralBuf(FL2_lzmaEncoderCtx* enc, const BYTE* data_block, size_t index)
{
U32 symbol = data_block[index];
if (IsCharState(enc->states.state)) {
unsigned prev_symbol = data_block[index - 1];
EncodeLiteral(enc, index, symbol, prev_symbol);
}
else {
EncodeLiteralMatched(enc, data_block, index, symbol);
}
}
static size_t RMF_bitpackExtendMatch(const BYTE* const data,
const U32* const table,
ptrdiff_t const start_index,
ptrdiff_t limit,
U32 const link,
size_t const length)
{
ptrdiff_t end_index = start_index + length;
ptrdiff_t dist = start_index - link;
if (limit > start_index + (ptrdiff_t)kMatchLenMax)
limit = start_index + kMatchLenMax;
while (end_index < limit && end_index - (table[end_index] & RADIX_LINK_MASK) == dist) {
end_index += table[end_index] >> RADIX_LINK_BITS;
}
if (end_index >= limit) {
DEBUGLOG(7, "RMF_bitpackExtendMatch : pos %u, link %u, init length %u, full length %u", (U32)start_index, link, (U32)length, (U32)(limit - start_index));
return limit - start_index;
}
while (end_index < limit && data[end_index - dist] == data[end_index]) {
++end_index;
}
DEBUGLOG(7, "RMF_bitpackExtendMatch : pos %u, link %u, init length %u, full length %u", (U32)start_index, link, (U32)length, (U32)(end_index - start_index));
return end_index - start_index;
}
#define GetMatchLink(table, index) ((const RMF_unit*)(table))[(index) >> UNIT_BITS].links[(index) & UNIT_MASK]
#define GetMatchLength(table, index) ((const RMF_unit*)(table))[(index) >> UNIT_BITS].lengths[(index) & UNIT_MASK]
static size_t RMF_structuredExtendMatch(const BYTE* const data,
const U32* const table,
ptrdiff_t const start_index,
ptrdiff_t limit,
U32 const link,
size_t const length)
{
ptrdiff_t end_index = start_index + length;
ptrdiff_t dist = start_index - link;
if (limit > start_index + (ptrdiff_t)kMatchLenMax)
limit = start_index + kMatchLenMax;
while (end_index < limit && end_index - GetMatchLink(table, end_index) == dist) {
end_index += GetMatchLength(table, end_index);
}
if (end_index >= limit) {
DEBUGLOG(7, "RMF_structuredExtendMatch : pos %u, link %u, init length %u, full length %u", (U32)start_index, link, (U32)length, (U32)(limit - start_index));
return limit - start_index;
}
while (end_index < limit && data[end_index - dist] == data[end_index]) {
++end_index;
}
DEBUGLOG(7, "RMF_structuredExtendMatch : pos %u, link %u, init length %u, full length %u", (U32)start_index, link, (U32)length, (U32)(end_index - start_index));
return end_index - start_index;
}
FORCE_INLINE_TEMPLATE
Match FL2_radixGetMatch(FL2_dataBlock block,
FL2_matchTable* tbl,
unsigned max_depth,
int structTbl,
size_t index)
{
if (structTbl)
{
Match match;
U32 link = GetMatchLink(tbl->table, index);
size_t length;
size_t dist;
match.length = 0;
if (link == RADIX_NULL_LINK)
return match;
length = GetMatchLength(tbl->table, index);
dist = index - link - 1;
if (length > block.end - index) {
match.length = (U32)(block.end - index);
}
else if (length == max_depth
|| length == STRUCTURED_MAX_LENGTH /* from HandleRepeat */)
{
match.length = (U32)RMF_structuredExtendMatch(block.data, tbl->table, index, block.end, link, length);
}
else {
match.length = (U32)length;
}
match.dist = (U32)dist;
return match;
}
else {
Match match;
U32 link = tbl->table[index];
size_t length;
size_t dist;
match.length = 0;
if (link == RADIX_NULL_LINK)
return match;
length = link >> RADIX_LINK_BITS;
link &= RADIX_LINK_MASK;
dist = index - link - 1;
if (length > block.end - index) {
match.length = (U32)(block.end - index);
}
else if (length == max_depth
|| length == BITPACK_MAX_LENGTH /* from HandleRepeat */)
{
match.length = (U32)RMF_bitpackExtendMatch(block.data, tbl->table, index, block.end, link, length);
}
else {
match.length = (U32)length;
}
match.dist = (U32)dist;
return match;
}
}
FORCE_INLINE_TEMPLATE
Match FL2_radixGetNextMatch(FL2_dataBlock block,
FL2_matchTable* tbl,
unsigned max_depth,
int structTbl,
size_t index)
{
if (structTbl)
{
Match match;
U32 link = GetMatchLink(tbl->table, index);
size_t length;
size_t dist;
match.length = 0;
if (link == RADIX_NULL_LINK)
return match;
length = GetMatchLength(tbl->table, index);
dist = index - link - 1;
if (link - 1 == GetMatchLink(tbl->table, index - 1)) {
/* same as the previous match, one byte shorter */
return match;
}
if (length > block.end - index) {
match.length = (U32)(block.end - index);
}
else if (length == max_depth
|| length == STRUCTURED_MAX_LENGTH /* from HandleRepeat */)
{
match.length = (U32)RMF_structuredExtendMatch(block.data, tbl->table, index, block.end, link, length);
}
else {
match.length = (U32)length;
}
match.dist = (U32)dist;
return match;
}
else {
Match match;
U32 link = tbl->table[index];
size_t length;
size_t dist;
match.length = 0;
if (link == RADIX_NULL_LINK)
return match;
length = link >> RADIX_LINK_BITS;
link &= RADIX_LINK_MASK;
dist = index - link - 1;
if (link - 1 == (tbl->table[index - 1] & RADIX_LINK_MASK)) {
/* same distance, one byte shorter */
return match;
}
if (length > block.end - index) {
match.length = (U32)(block.end - index);
}
else if (length == max_depth
|| length == BITPACK_MAX_LENGTH /* from HandleRepeat */)
{
match.length = (U32)RMF_bitpackExtendMatch(block.data, tbl->table, index, block.end, link, length);
}
else {
match.length = (U32)length;
}
match.dist = (U32)dist;
return match;
}
}
static void LengthStates_SetPrices(RangeEncoder* rc, LengthStates* ls, size_t pos_state)
{
unsigned prob = ls->choice;
unsigned a0 = GET_PRICE_0(rc, prob);
unsigned a1 = GET_PRICE_1(rc, prob);
unsigned b0, b1;
size_t i = 0;
prob = ls->choice_2;
b0 = a1 + GET_PRICE_0(rc, prob);
b1 = a1 + GET_PRICE_1(rc, prob);
for (; i < kLenNumLowSymbols && i < ls->table_size; ++i) {
ls->prices[pos_state][i] = a0 + GetTreePrice(rc, ls->low + (pos_state << kLenNumLowBits), kLenNumLowBits, i);
}
for (; i < kLenNumLowSymbols + kLenNumMidSymbols && i < ls->table_size; ++i) {
ls->prices[pos_state][i] = b0 + GetTreePrice(rc, ls->mid + (pos_state << kLenNumMidBits), kLenNumMidBits, i - kLenNumLowSymbols);
}
for (; i < ls->table_size; ++i) {
ls->prices[pos_state][i] = b1 + GetTreePrice(rc, ls->high, kLenNumHighBits, i - kLenNumLowSymbols - kLenNumMidSymbols);
}
ls->counters[pos_state] = (unsigned)(ls->table_size);
}
static void EncodeLength(FL2_lzmaEncoderCtx* enc, LengthStates* len_prob_table, unsigned len, size_t pos_state)
{
len -= kMatchLenMin;
if (len < kLenNumLowSymbols) {
EncodeBit0(&enc->rc, &len_prob_table->choice);
EncodeBitTree(&enc->rc, len_prob_table->low + (pos_state << kLenNumLowBits), kLenNumLowBits, len);
}
else {
EncodeBit1(&enc->rc, &len_prob_table->choice);
if (len < kLenNumLowSymbols + kLenNumMidSymbols) {
EncodeBit0(&enc->rc, &len_prob_table->choice_2);
EncodeBitTree(&enc->rc, len_prob_table->mid + (pos_state << kLenNumMidBits), kLenNumMidBits, len - kLenNumLowSymbols);
}
else {
EncodeBit1(&enc->rc, &len_prob_table->choice_2);
EncodeBitTree(&enc->rc, len_prob_table->high, kLenNumHighBits, len - kLenNumLowSymbols - kLenNumMidSymbols);
}
}
if (enc->strategy != FL2_fast && --len_prob_table->counters[pos_state] == 0) {
LengthStates_SetPrices(&enc->rc, len_prob_table, pos_state);
}
}
static void EncodeRepMatch(FL2_lzmaEncoderCtx* enc, unsigned len, unsigned rep, size_t pos_state)
{
DEBUGLOG(7, "EncodeRepMatch : length %u, rep %u", len, rep);
EncodeBit1(&enc->rc, &enc->states.is_match[enc->states.state][pos_state]);
EncodeBit1(&enc->rc, &enc->states.is_rep[enc->states.state]);
if (rep == 0) {
EncodeBit0(&enc->rc, &enc->states.is_rep_G0[enc->states.state]);
EncodeBit(&enc->rc, &enc->states.is_rep0_long[enc->states.state][pos_state], ((len == 1) ? 0 : 1));
}
else {
U32 distance = enc->states.reps[rep];
EncodeBit1(&enc->rc, &enc->states.is_rep_G0[enc->states.state]);
if (rep == 1) {
EncodeBit0(&enc->rc, &enc->states.is_rep_G1[enc->states.state]);
}
else {
EncodeBit1(&enc->rc, &enc->states.is_rep_G1[enc->states.state]);
EncodeBit(&enc->rc, &enc->states.is_rep_G2[enc->states.state], rep - 2);
if (rep == 3) {
enc->states.reps[3] = enc->states.reps[2];
}
enc->states.reps[2] = enc->states.reps[1];
}
enc->states.reps[1] = enc->states.reps[0];
enc->states.reps[0] = distance;
}
if (len == 1) {
enc->states.state = ShortRepNextState(enc->states.state);
}
else {
EncodeLength(enc, &enc->states.rep_len_states, len, pos_state);
enc->states.state = RepNextState(enc->states.state);
}
}
/* *****************************************/
/* Distance slot functions based on fastpos.h from XZ*/
HINT_INLINE
unsigned FastDistShift(unsigned n)
{
return n * (kFastDistBits - 1);
}
HINT_INLINE
unsigned FastDistResult(U32 dist, unsigned n)
{
return distance_table[dist >> FastDistShift(n)]
+ 2 * FastDistShift(n);
}
static size_t GetDistSlot(U32 distance)
{
U32 limit = 1UL << kFastDistBits;
/* If it is small enough, we can pick the result directly from */
/* the precalculated table. */
if (distance < limit) {
return distance_table[distance];
}
limit <<= FastDistShift(1);
if (distance < limit) {
return FastDistResult(distance, 1);
}
return FastDistResult(distance, 2);
}
/* **************************************** */
static void EncodeNormalMatch(FL2_lzmaEncoderCtx* enc, unsigned len, U32 dist, size_t pos_state)
{
DEBUGLOG(7, "EncodeNormalMatch : length %u, dist %u", len, dist);
EncodeBit1(&enc->rc, &enc->states.is_match[enc->states.state][pos_state]);
EncodeBit0(&enc->rc, &enc->states.is_rep[enc->states.state]);
enc->states.state = MatchNextState(enc->states.state);
EncodeLength(enc, &enc->states.len_states, len, pos_state);
{ size_t dist_slot = GetDistSlot(dist);
EncodeBitTree(&enc->rc, enc->states.dist_slot_encoders[GetLenToDistState(len)], kNumPosSlotBits, (unsigned)(dist_slot));
if (dist_slot >= kStartPosModelIndex) {
unsigned footerBits = ((unsigned)(dist_slot >> 1) - 1);
size_t base = ((2 | (dist_slot & 1)) << footerBits);
unsigned posReduced = (unsigned)(dist - base);
if (dist_slot < kEndPosModelIndex) {
EncodeBitTreeReverse(&enc->rc, enc->states.dist_encoders + base - dist_slot - 1, footerBits, posReduced);
}
else {
EncodeDirect(&enc->rc, posReduced >> kNumAlignBits, footerBits - kNumAlignBits);
EncodeBitTreeReverse(&enc->rc, enc->states.dist_align_encoders, kNumAlignBits, posReduced & kAlignMask);
++enc->align_price_count;
}
}
}
enc->states.reps[3] = enc->states.reps[2];
enc->states.reps[2] = enc->states.reps[1];
enc->states.reps[1] = enc->states.reps[0];
enc->states.reps[0] = dist;
++enc->match_price_count;
}
#if defined(_MSC_VER)
# pragma warning(disable : 4701) /* disable: C4701: potentially uninitialized local variable */
#endif
FORCE_INLINE_TEMPLATE
size_t EncodeChunkFast(FL2_lzmaEncoderCtx* enc,
FL2_dataBlock const block,
FL2_matchTable* tbl,
int structTbl,
size_t index,
size_t uncompressed_end)
{
size_t const pos_mask = enc->pos_mask;
size_t prev = index;
unsigned search_depth = tbl->params.depth;
while (index < uncompressed_end && enc->rc.out_index < enc->rc.chunk_size)
{
size_t max_len;
const BYTE* data;
/* Table of distance restrictions for short matches */
static const U32 max_dist_table[] = { 0, 0, 0, 1 << 6, 1 << 14 };
/* Get a match from the table, extended to its full length */
Match bestMatch = FL2_radixGetMatch(block, tbl, search_depth, structTbl, index);
if (bestMatch.length < kMatchLenMin) {
++index;
continue;
}
/* Use if near enough */
if (bestMatch.length >= 5 || bestMatch.dist < max_dist_table[bestMatch.length]) {
bestMatch.dist += kNumReps;
}
else {
bestMatch.length = 0;
}
max_len = MIN(kMatchLenMax, block.end - index);
data = block.data + index;
{ Match bestRep;
Match repMatch;
bestRep.length = 0;
for (repMatch.dist = 0; repMatch.dist < kNumReps; ++repMatch.dist) {
const BYTE *data_2 = data - enc->states.reps[repMatch.dist] - 1;
if (MEM_read16(data) != MEM_read16(data_2)) {
continue;
}
repMatch.length = (U32)(ZSTD_count(data + 2, data_2 + 2, data + max_len) + 2);
if (repMatch.length >= max_len) {
bestMatch = repMatch;
goto _encode;
}
if (repMatch.length > bestRep.length) {
bestRep = repMatch;
}
}
if (bestMatch.length >= max_len)
goto _encode;
if (bestRep.length >= 2) {
int const gain2 = (int)(bestRep.length * 3 - bestRep.dist);
int const gain1 = (int)(bestMatch.length * 3 - ZSTD_highbit32(bestMatch.dist + 1) + 1);
if (gain2 > gain1) {
DEBUGLOG(7, "Replace match (%u, %u) with rep (%u, %u)", bestMatch.length, bestMatch.dist, bestRep.length, bestRep.dist);
bestMatch = bestRep;
}
}
}
if (bestMatch.length < kMatchLenMin) {
++index;
continue;
}
for (size_t next = index + 1; bestMatch.length < kMatchLenMax && next < uncompressed_end; ++next) {
/* lazy matching scheme from ZSTD */
Match next_match = FL2_radixGetNextMatch(block, tbl, search_depth, structTbl, next);
if (next_match.length >= kMatchLenMin) {
Match bestRep;
Match repMatch;
bestRep.length = 0;
data = block.data + next;
max_len = MIN(kMatchLenMax, block.end - next);
for (repMatch.dist = 0; repMatch.dist < kNumReps; ++repMatch.dist) {
const BYTE *data_2 = data - enc->states.reps[repMatch.dist] - 1;
if (MEM_read16(data) != MEM_read16(data_2)) {
continue;
}
repMatch.length = (U32)(ZSTD_count(data + 2, data_2 + 2, data + max_len) + 2);
if (repMatch.length > bestRep.length) {
bestRep = repMatch;
}
}
if (bestRep.length >= 3) {
int const gain2 = (int)(bestRep.length * 3 - bestRep.dist);
int const gain1 = (int)(bestMatch.length * 3 - ZSTD_highbit32((U32)bestMatch.dist + 1) + 1);
if (gain2 > gain1) {
DEBUGLOG(7, "Replace match (%u, %u) with rep (%u, %u)", bestMatch.length, bestMatch.dist, bestRep.length, bestRep.dist);
bestMatch = bestRep;
index = next;
}
}
if (next_match.length >= 3 && next_match.dist != bestMatch.dist) {
int const gain2 = (int)(next_match.length * 4 - ZSTD_highbit32((U32)next_match.dist + 1)); /* raw approx */
int const gain1 = (int)(bestMatch.length * 4 - ZSTD_highbit32((U32)bestMatch.dist + 1) + 4);
if (gain2 > gain1) {
DEBUGLOG(7, "Replace match (%u, %u) with match (%u, %u)", bestMatch.length, bestMatch.dist, next_match.length, next_match.dist + kNumReps);
bestMatch = next_match;
bestMatch.dist += kNumReps;
index = next;
continue;
}
}
}
if (next < uncompressed_end - 4) {
Match bestRep;
Match repMatch;
++next;
next_match = FL2_radixGetNextMatch(block, tbl, search_depth, structTbl, next);
if (next_match.length < 4)
break;
data = block.data + next;
max_len = MIN(kMatchLenMax, block.end - next);
bestRep.length = 0;
for (repMatch.dist = 0; repMatch.dist < kNumReps; ++repMatch.dist) {
const BYTE *data_2 = data - enc->states.reps[repMatch.dist] - 1;
if (MEM_read16(data) != MEM_read16(data_2)) {
continue;
}
repMatch.length = (U32)(ZSTD_count(data + 2, data_2 + 2, data + max_len) + 2);
if (repMatch.length > bestRep.length) {
bestRep = repMatch;
}
}
if (bestRep.length >= 4) {
int const gain2 = (int)(bestRep.length * 4 - (bestRep.dist >> 1));
int const gain1 = (int)(bestMatch.length * 4 - ZSTD_highbit32((U32)bestMatch.dist + 1) + 1);
if (gain2 > gain1) {
DEBUGLOG(7, "Replace match (%u, %u) with rep (%u, %u)", bestMatch.length, bestMatch.dist, bestRep.length, bestRep.dist);
bestMatch = bestRep;
index = next;
}
}
if (next_match.length >= 4 && next_match.dist != bestMatch.dist) {
int const gain2 = (int)(next_match.length * 4 - ZSTD_highbit32((U32)next_match.dist + 1));
int const gain1 = (int)(bestMatch.length * 4 - ZSTD_highbit32((U32)bestMatch.dist + 1) + 7);
if (gain2 > gain1) {
DEBUGLOG(7, "Replace match (%u, %u) with match (%u, %u)", bestMatch.length, bestMatch.dist, next_match.length, next_match.dist + kNumReps);
bestMatch = next_match;
bestMatch.dist += kNumReps;
index = next;
continue;
}
}
}
break;
}
_encode:
assert(index + bestMatch.length <= block.end);
while (prev < index && enc->rc.out_index < enc->rc.chunk_size) {
if (block.data[prev] == block.data[prev - enc->states.reps[0] - 1]) {
EncodeRepMatch(enc, 1, 0, prev & pos_mask);
}
else {
EncodeLiteralBuf(enc, block.data, prev);
}
++prev;
}
if (enc->rc.out_index >= enc->rc.chunk_size) {
break;
}
if(bestMatch.length >= kMatchLenMin) {
if (bestMatch.dist < kNumReps) {
EncodeRepMatch(enc, bestMatch.length, bestMatch.dist, index & pos_mask);
}
else {
EncodeNormalMatch(enc, bestMatch.length, bestMatch.dist - kNumReps, index & pos_mask);
}
index += bestMatch.length;
prev = index;
}
}
while (prev < index && enc->rc.out_index < enc->rc.chunk_size) {
if (block.data[prev] == block.data[prev - enc->states.reps[0] - 1]) {
EncodeRepMatch(enc, 1, 0, prev & pos_mask);
}
else {
EncodeLiteralBuf(enc, block.data, prev);
}
++prev;
}
Flush(&enc->rc);
return prev;
}
/* Reverse the direction of the linked list generated by the optimal parser */
static void ReverseOptimalChain(OptimalNode* opt_buf, size_t cur)
{
size_t next_index = opt_buf[cur].prev_index;
U32 next_dist = opt_buf[cur].prev_dist;
do
{
if (opt_buf[cur].is_combination)
{
MakeAsLiteral(opt_buf[next_index]);
opt_buf[next_index].prev_index = (unsigned)(next_index - 1);
if (opt_buf[cur].prev_2)
{
opt_buf[next_index - 1].is_combination = 0;
opt_buf[next_index - 1].prev_index = opt_buf[cur].prev_index_2;
opt_buf[next_index - 1].prev_dist = opt_buf[cur].prev_dist_2;
}
}
{ U32 temp = opt_buf[next_index].prev_dist;
opt_buf[next_index].prev_dist = next_dist;
next_dist = temp;
}
{ size_t prev_index = next_index;
next_index = opt_buf[prev_index].prev_index;
opt_buf[prev_index].prev_index = (unsigned)(cur);
cur = prev_index;
}
} while (cur != 0);
}
static unsigned GetLiteralPrice(FL2_lzmaEncoderCtx* enc, size_t index, size_t state, unsigned prev_symbol, U32 symbol, unsigned match_byte)
{
const Probability* prob_table = GetLiteralProbs(enc, index, prev_symbol);
if (IsCharState(state)) {
unsigned price = 0;
symbol |= 0x100;
do {
price += GET_PRICE(enc->rc, prob_table[symbol >> 8], (symbol >> 7) & 1);
symbol <<= 1;
} while (symbol < 0x10000);
return price;
}
return GetLiteralPriceMatched(&enc->rc, prob_table, symbol, match_byte);
}
static void HashReset(FL2_lzmaEncoderCtx* enc, unsigned dictionary_bits_3)
{
enc->hash_dict_3 = (ptrdiff_t)1 << dictionary_bits_3;
enc->chain_mask_3 = enc->hash_dict_3 - 1;
memset(enc->hash_buf->table_3, 0xFF, sizeof(enc->hash_buf->table_3));
}
static int HashCreate(FL2_lzmaEncoderCtx* enc, unsigned dictionary_bits_3)
{
DEBUGLOG(3, "Create hash chain : dict bits %u", dictionary_bits_3);
if (enc->hash_buf) {
free(enc->hash_buf);
}
enc->hash_alloc_3 = (ptrdiff_t)1 << dictionary_bits_3;
enc->hash_buf = malloc(sizeof(HashChains) + (enc->hash_alloc_3 - 1) * sizeof(S32));
if (enc->hash_buf == NULL)
return 1;
HashReset(enc, dictionary_bits_3);
return 0;
}
/* Create a hash chain for hybrid mode */
int FL2_lzma2HashAlloc(FL2_lzmaEncoderCtx* enc, const FL2_lzma2Parameters* options)
{
if (enc->strategy == FL2_ultra && enc->hash_alloc_3 < ((ptrdiff_t)1 << options->second_dict_bits)) {
return HashCreate(enc, options->second_dict_bits);
}
return 0;
}
#define GET_HASH_3(data) ((((MEM_readLE32(data)) << 8) * 506832829U) >> (32 - kHash3Bits))
HINT_INLINE
size_t HashGetMatches(FL2_lzmaEncoderCtx* enc, const FL2_dataBlock block,
ptrdiff_t index,
size_t length_limit,
Match match)
{
ptrdiff_t const hash_dict_3 = enc->hash_dict_3;
const BYTE* data = block.data;
HashChains* tbl = enc->hash_buf;
ptrdiff_t const chain_mask_3 = enc->chain_mask_3;
size_t max_len;
ptrdiff_t first_3;
enc->match_count = 0;
enc->hash_prev_index = MAX(enc->hash_prev_index, index - hash_dict_3);
/* Update hash tables and chains for any positions that were skipped */
while (++enc->hash_prev_index < index) {
size_t hash = GET_HASH_3(data + enc->hash_prev_index);
tbl->hash_chain_3[enc->hash_prev_index & chain_mask_3] = tbl->table_3[hash];
tbl->table_3[hash] = (S32)enc->hash_prev_index;
}
data += index;
max_len = 2;
{ size_t hash = GET_HASH_3(data);
first_3 = tbl->table_3[hash];
tbl->table_3[hash] = (S32)(index);
}
if (first_3 >= 0) {
int cycles = enc->match_cycles;
ptrdiff_t end_index = index - (((ptrdiff_t)match.dist < hash_dict_3) ? match.dist : hash_dict_3);
ptrdiff_t match_3 = first_3;
if (match_3 >= end_index) {
do {
--cycles;
const BYTE* data_2 = block.data + match_3;
size_t len_test = ZSTD_count(data + 1, data_2 + 1, data + length_limit) + 1;
if (len_test > max_len) {
enc->matches[enc->match_count].length = (U32)len_test;
enc->matches[enc->match_count].dist = (U32)(index - match_3 - 1);
++enc->match_count;
max_len = len_test;
if (len_test >= length_limit) {
break;
}
}
if (cycles <= 0)
break;
match_3 = tbl->hash_chain_3[match_3 & chain_mask_3];
} while (match_3 >= end_index);
}
}
tbl->hash_chain_3[index & chain_mask_3] = (S32)first_3;
if ((unsigned)(max_len) < match.length) {
enc->matches[enc->match_count] = match;
++enc->match_count;
return match.length;
}
return max_len;
}
#if defined(_MSC_VER)
# pragma warning(disable : 4701) /* disable: C4701: potentially uninitialized local variable */
#endif
/* The speed of this function is critical and the sections have so many variables
* in common that breaking it up would be inefficient.
* For each position cur, starting at 1, check some or all possible
* encoding choices - a literal, 1-byte rep 0 match, all rep match lengths, and
* all match lengths at available distances. It also checks the combined
* sequences literal+rep0, rep+rep0 and match+rep0.
* If is_hybrid != 0, this method works in hybrid mode, using the
* hash chain to find shorter matches at near distances. */
FORCE_INLINE_TEMPLATE
size_t OptimalParse(FL2_lzmaEncoderCtx* const enc, const FL2_dataBlock block,
Match match,
size_t const index,
size_t const cur,
size_t len_end,
int const is_hybrid,
U32* const reps)
{
OptimalNode* cur_opt = &enc->opt_buf[cur];
size_t prev_index = cur_opt->prev_index;
size_t state = enc->opt_buf[prev_index].state;
size_t const pos_mask = enc->pos_mask;
size_t pos_state = (index & pos_mask);
const BYTE* data = block.data + index;
size_t const fast_length = enc->fast_length;
size_t bytes_avail;
size_t max_length;
size_t start_len;
U32 match_price;
U32 rep_match_price;
Probability is_rep_prob;
if (cur_opt->is_combination) {
--prev_index;
if (cur_opt->prev_2) {
state = enc->opt_buf[cur_opt->prev_index_2].state;
if (cur_opt->prev_dist_2 < kNumReps) {
state = RepNextState(state);
}
else {
state = MatchNextState(state);
}
}
else {
state = enc->opt_buf[prev_index].state;
}
state = LiteralNextState(state);
}
if (prev_index == cur - 1) {
if (cur_opt->prev_dist == 0) {
state = ShortRepNextState(state);
}
else {
state = LiteralNextState(state);
}
}
else {
size_t dist;
if (cur_opt->is_combination && cur_opt->prev_2) {
prev_index = cur_opt->prev_index_2;
dist = cur_opt->prev_dist_2;
state = RepNextState(state);
}
else {
dist = cur_opt->prev_dist;
if (dist < kNumReps) {
state = RepNextState(state);
}
else {
state = MatchNextState(state);
}
}
const OptimalNode* prev_opt = &enc->opt_buf[prev_index];
if (dist < kNumReps) {
size_t i = 1;
reps[0] = prev_opt->reps[dist];
for (; i <= dist; ++i) {
reps[i] = prev_opt->reps[i - 1];
}
for (; i < kNumReps; ++i) {
reps[i] = prev_opt->reps[i];
}
}
else {
reps[0] = (U32)(dist - kNumReps);
for (size_t i = 1; i < kNumReps; ++i) {
reps[i] = prev_opt->reps[i - 1];
}
}
}
cur_opt->state = state;
memcpy(cur_opt->reps, reps, sizeof(cur_opt->reps));
is_rep_prob = enc->states.is_rep[state];
{ Probability is_match_prob = enc->states.is_match[state][pos_state];
unsigned cur_byte = *data;
unsigned match_byte = *(data - reps[0] - 1);
U32 cur_price = cur_opt->price;
U32 cur_and_lit_price = cur_price + GET_PRICE_0(rc, is_match_prob) +
GetLiteralPrice(enc, index, state, data[-1], cur_byte, match_byte);
OptimalNode* next_opt = &enc->opt_buf[cur + 1];
BYTE next_is_char = 0;
/* Try literal */
if (cur_and_lit_price < next_opt->price) {
next_opt->price = cur_and_lit_price;
next_opt->prev_index = (unsigned)cur;
MakeAsLiteral(*next_opt);
next_is_char = 1;
}
match_price = cur_price + GET_PRICE_1(rc, is_match_prob);
rep_match_price = match_price + GET_PRICE_1(rc, is_rep_prob);
if (match_byte == cur_byte) {
/* Try 1-byte rep0 */
U32 short_rep_price = rep_match_price + GetRepLen1Price(enc, state, pos_state);
if (short_rep_price <= next_opt->price) {
next_opt->price = short_rep_price;
next_opt->prev_index = (unsigned)cur;
MakeAsShortRep(*next_opt);
next_is_char = 1;
}
}
bytes_avail = MIN(block.end - index, kOptimizerBufferSize - 1 - cur);
if (bytes_avail < 2)
return len_end;
if (!next_is_char && match_byte != cur_byte) {
/* Try literal + rep0 */
const BYTE *data_2 = data - reps[0];
size_t limit = MIN(bytes_avail - 1, fast_length);
size_t len_test_2 = ZSTD_count(data + 1, data_2, data + 1 + limit);
if (len_test_2 >= 2) {
size_t state_2 = LiteralNextState(state);
size_t pos_state_next = (index + 1) & pos_mask;
U32 next_rep_match_price = cur_and_lit_price +
GET_PRICE_1(rc, enc->states.is_match[state_2][pos_state_next]) +
GET_PRICE_1(rc, enc->states.is_rep[state_2]);
size_t offset = cur + 1 + len_test_2;
U32 cur_and_len_price = next_rep_match_price + GetRepMatch0Price(enc, len_test_2, state_2, pos_state_next);
if (cur_and_len_price < enc->opt_buf[offset].price) {
len_end = MAX(len_end, offset);
enc->opt_buf[offset].price = cur_and_len_price;
enc->opt_buf[offset].prev_index = (unsigned)(cur + 1);
enc->opt_buf[offset].prev_dist = 0;
enc->opt_buf[offset].is_combination = 1;
enc->opt_buf[offset].prev_2 = 0;
}
}
}
}
max_length = MIN(bytes_avail, fast_length);
start_len = 2;
if (match.length > 0) {
size_t len_test;
size_t len;
U32 cur_rep_price;
for (size_t rep_index = 0; rep_index < kNumReps; ++rep_index) {
const BYTE *data_2 = data - reps[rep_index] - 1;
if (MEM_read16(data) != MEM_read16(data_2))
continue;
len_test = ZSTD_count(data + 2, data_2 + 2, data + max_length) + 2;
len_end = MAX(len_end, cur + len_test);
cur_rep_price = rep_match_price + GetRepPrice(enc, rep_index, state, pos_state);
len = 2;
/* Try rep match */
do {
U32 cur_and_len_price = cur_rep_price + enc->states.rep_len_states.prices[pos_state][len - kMatchLenMin];
OptimalNode* opt = &enc->opt_buf[cur + len];
if (cur_and_len_price < opt->price) {
opt->price = cur_and_len_price;
opt->prev_index = (unsigned)cur;
opt->prev_dist = (U32)(rep_index);
opt->is_combination = 0;
}
} while (++len <= len_test);
if (rep_index == 0) {
/* Save time by exluding normal matches not longer than the rep */
start_len = len_test + 1;
}
if (is_hybrid && len_test + 3 <= bytes_avail && MEM_read16(data + len_test + 1) == MEM_read16(data_2 + len_test + 1)) {
/* Try rep + literal + rep0 */
size_t len_test_2 = ZSTD_count(data + len_test + 3,
data_2 + len_test + 3,
data + MIN(len_test + 1 + fast_length, bytes_avail)) + 2;
size_t state_2 = RepNextState(state);
size_t pos_state_next = (index + len_test) & pos_mask;
U32 rep_lit_rep_total_price =
cur_rep_price + enc->states.rep_len_states.prices[pos_state][len_test - kMatchLenMin] +
GET_PRICE_0(rc, enc->states.is_match[state_2][pos_state_next]) +
GetLiteralPriceMatched(&enc->rc, GetLiteralProbs(enc, index + len_test, data[len_test - 1]),
data[len_test], data_2[len_test]);
size_t offset;
state_2 = LiteralNextState(state_2);
pos_state_next = (index + len_test + 1) & pos_mask;
rep_lit_rep_total_price +=
GET_PRICE_1(rc, enc->states.is_match[state_2][pos_state_next]) +
GET_PRICE_1(rc, enc->states.is_rep[state_2]);
offset = cur + len_test + 1 + len_test_2;
rep_lit_rep_total_price += GetRepMatch0Price(enc, len_test_2, state_2, pos_state_next);
if (rep_lit_rep_total_price < enc->opt_buf[offset].price) {
len_end = MAX(len_end, offset);
enc->opt_buf[offset].price = rep_lit_rep_total_price;
enc->opt_buf[offset].prev_index = (unsigned)(cur + len_test + 1);
enc->opt_buf[offset].prev_dist = 0;
enc->opt_buf[offset].is_combination = 1;
enc->opt_buf[offset].prev_2 = 1;
enc->opt_buf[offset].prev_index_2 = (unsigned)cur;
enc->opt_buf[offset].prev_dist_2 = (U32)(rep_index);
}
}
}
}
if (match.length >= start_len && max_length >= start_len) {
/* Try normal match */
U32 normal_match_price = match_price + GET_PRICE_0(rc, is_rep_prob);
if (!is_hybrid) {
/* Normal mode - single match */
size_t length = MIN(match.length, max_length);
size_t cur_dist = match.dist;
size_t dist_slot = GetDistSlot(match.dist);
size_t len_test = length;
len_end = MAX(len_end, cur + length);
/* Pre-load rep0 data bytes */
/* unsigned rep_0_bytes = MEM_read16(data - cur_dist + length); */
for (; len_test >= start_len; --len_test) {
OptimalNode *opt;
U32 cur_and_len_price = normal_match_price + enc->states.len_states.prices[pos_state][len_test - kMatchLenMin];
size_t len_to_dist_state = GetLenToDistState(len_test);
if (cur_dist < kNumFullDistances) {
cur_and_len_price += enc->distance_prices[len_to_dist_state][cur_dist];
}
else {
cur_and_len_price += enc->dist_slot_prices[len_to_dist_state][dist_slot] + enc->align_prices[cur_dist & kAlignMask];
}
opt = &enc->opt_buf[cur + len_test];
if (cur_and_len_price < opt->price) {
opt->price = cur_and_len_price;
opt->prev_index = (unsigned)cur;
opt->prev_dist = (U32)(cur_dist + kNumReps);
opt->is_combination = 0;
}
else break;
}
}
else {
/* Hybrid mode */
size_t main_len;
ptrdiff_t match_index;
ptrdiff_t start_match;
match.length = MIN(match.length, (U32)max_length);
if (match.length < 3 || match.dist < 256) {
enc->matches[0] = match;
enc->match_count = 1;
main_len = match.length;
}
else {
main_len = HashGetMatches(enc, block, index, max_length, match);
}
match_index = enc->match_count - 1;
if (main_len == max_length
&& match_index > 0
&& enc->matches[match_index - 1].length == main_len)
{
--match_index;
}
len_end = MAX(len_end, cur + main_len);
start_match = 0;
while (start_len > enc->matches[start_match].length) {
++start_match;
}
for (; match_index >= start_match; --match_index) {
size_t len_test = enc->matches[match_index].length;
size_t cur_dist = enc->matches[match_index].dist;
size_t dist_slot = GetDistSlot((U32)cur_dist);
U32 cur_and_len_price;
size_t base_len = (match_index > start_match) ? enc->matches[match_index - 1].length + 1 : start_len;
unsigned rep_0_bytes = MEM_read16(data - cur_dist + len_test);
for (; len_test >= base_len; --len_test) {
size_t len_to_dist_state;
OptimalNode *opt;
cur_and_len_price = normal_match_price + enc->states.len_states.prices[pos_state][len_test - kMatchLenMin];
len_to_dist_state = GetLenToDistState(len_test);
if (cur_dist < kNumFullDistances) {
cur_and_len_price += enc->distance_prices[len_to_dist_state][cur_dist];
}
else {
cur_and_len_price += enc->dist_slot_prices[len_to_dist_state][dist_slot] + enc->align_prices[cur_dist & kAlignMask];
}
opt = &enc->opt_buf[cur + len_test];
if (cur_and_len_price < opt->price) {
opt->price = cur_and_len_price;
opt->prev_index = (unsigned)cur;
opt->prev_dist = (U32)(cur_dist + kNumReps);
opt->is_combination = 0;
}
else if(len_test < main_len)
break;
if (len_test == enc->matches[match_index].length) {
size_t rep_0_pos = len_test + 1;
if (rep_0_pos + 2 <= bytes_avail && rep_0_bytes == MEM_read16(data + rep_0_pos)) {
/* Try match + literal + rep0 */
const BYTE *data_2 = data - cur_dist - 1;
size_t limit = MIN(rep_0_pos + fast_length, bytes_avail);
size_t len_test_2 = ZSTD_count(data + rep_0_pos + 2, data_2 + rep_0_pos + 2, data + limit) + 2;
size_t state_2 = MatchNextState(state);
size_t pos_state_next = (index + len_test) & pos_mask;
U32 match_lit_rep_total_price = cur_and_len_price +
GET_PRICE_0(rc, enc->states.is_match[state_2][pos_state_next]) +
GetLiteralPriceMatched(&enc->rc, GetLiteralProbs(enc, index + len_test, data[len_test - 1]),
data[len_test], data_2[len_test]);
size_t offset;
state_2 = LiteralNextState(state_2);
pos_state_next = (pos_state_next + 1) & pos_mask;
match_lit_rep_total_price +=
GET_PRICE_1(rc, enc->states.is_match[state_2][pos_state_next]) +
GET_PRICE_1(rc, enc->states.is_rep[state_2]);
offset = cur + rep_0_pos + len_test_2;
match_lit_rep_total_price += GetRepMatch0Price(enc, len_test_2, state_2, pos_state_next);
if (match_lit_rep_total_price < enc->opt_buf[offset].price) {
len_end = MAX(len_end, offset);
enc->opt_buf[offset].price = match_lit_rep_total_price;
enc->opt_buf[offset].prev_index = (unsigned)(cur + rep_0_pos);
enc->opt_buf[offset].prev_dist = 0;
enc->opt_buf[offset].is_combination = 1;
enc->opt_buf[offset].prev_2 = 1;
enc->opt_buf[offset].prev_index_2 = (unsigned)cur;
enc->opt_buf[offset].prev_dist_2 = (U32)(cur_dist + kNumReps);
}
}
}
}
}
}
}
return len_end;
}
HINT_INLINE
void InitMatchesPos0(FL2_lzmaEncoderCtx* enc, const FL2_dataBlock block,
Match match,
size_t pos_state,
size_t len,
unsigned normal_match_price)
{
if ((unsigned)len <= match.length) {
size_t distance = match.dist;
size_t slot = GetDistSlot(match.dist);
/* Test every available length of the match */
do
{
unsigned cur_and_len_price = normal_match_price + enc->states.len_states.prices[pos_state][len - kMatchLenMin];
size_t len_to_dist_state = GetLenToDistState(len);
if (distance < kNumFullDistances) {
cur_and_len_price += enc->distance_prices[len_to_dist_state][distance];
}
else {
cur_and_len_price += enc->align_prices[distance & kAlignMask] + enc->dist_slot_prices[len_to_dist_state][slot];
}
if (cur_and_len_price < enc->opt_buf[len].price) {
enc->opt_buf[len].price = cur_and_len_price;
enc->opt_buf[len].prev_index = 0;
enc->opt_buf[len].prev_dist = (U32)(distance + kNumReps);
enc->opt_buf[len].is_combination = 0;
}
++len;
} while ((unsigned)len <= match.length);
}
}
static size_t InitMatchesPos0Best(FL2_lzmaEncoderCtx* enc, const FL2_dataBlock block,
Match match,
size_t index,
size_t len,
unsigned normal_match_price)
{
if (len <= match.length) {
size_t main_len;
size_t match_index;
size_t pos_state;
size_t distance;
size_t slot;
if (match.length < 3 || match.dist < 256) {
enc->matches[0] = match;
enc->match_count = 1;
main_len = match.length;
}
else {
main_len = HashGetMatches(enc, block, index, MIN(block.end - index, enc->fast_length), match);
}
match_index = 0;
while (len > enc->matches[match_index].length) {
++match_index;
}
pos_state = index & enc->pos_mask;
distance = enc->matches[match_index].dist;
slot = GetDistSlot(enc->matches[match_index].dist);
/* Test every available match length at the shortest distance. The buffer is sorted */
/* in order of increasing length, and therefore increasing distance too. */
for (;; ++len) {
unsigned cur_and_len_price = normal_match_price
+ enc->states.len_states.prices[pos_state][len - kMatchLenMin];
size_t len_to_dist_state = GetLenToDistState(len);
if (distance < kNumFullDistances) {
cur_and_len_price += enc->distance_prices[len_to_dist_state][distance];
}
else {
cur_and_len_price += enc->align_prices[distance & kAlignMask] + enc->dist_slot_prices[len_to_dist_state][slot];
}
if (cur_and_len_price < enc->opt_buf[len].price) {
enc->opt_buf[len].price = cur_and_len_price;
enc->opt_buf[len].prev_index = 0;
enc->opt_buf[len].prev_dist = (U32)(distance + kNumReps);
enc->opt_buf[len].is_combination = 0;
}
if (len == enc->matches[match_index].length) {
/* Run out of length for this match. Get the next if any. */
if (len == main_len) {
break;
}
++match_index;
distance = enc->matches[match_index].dist;
slot = GetDistSlot(enc->matches[match_index].dist);
}
}
return main_len;
}
return 0;
}
/* Test all available options at position 0 of the optimizer buffer.
* The prices at this point are all initialized to kInfinityPrice.
* This function must not be called at a position where no match is
* available. */
FORCE_INLINE_TEMPLATE
size_t InitOptimizerPos0(FL2_lzmaEncoderCtx* enc, const FL2_dataBlock block,
Match match,
size_t index,
int const is_hybrid,
U32* reps)
{
size_t max_length = MIN(block.end - index, kMatchLenMax);
const BYTE *data = block.data + index;
const BYTE *data_2;
size_t rep_max_index = 0;
size_t rep_lens[kNumReps];
/* Find any rep matches */
for (size_t i = 0; i < kNumReps; ++i) {
reps[i] = enc->states.reps[i];
data_2 = data - reps[i] - 1;
if (MEM_read16(data) != MEM_read16(data_2)) {
rep_lens[i] = 0;
continue;
}
rep_lens[i] = ZSTD_count(data + 2, data_2 + 2, data + max_length) + 2;
if (rep_lens[i] > rep_lens[rep_max_index]) {
rep_max_index = i;
}
}
if (rep_lens[rep_max_index] >= enc->fast_length) {
enc->opt_buf[0].prev_index = (unsigned)(rep_lens[rep_max_index]);
enc->opt_buf[0].prev_dist = (U32)(rep_max_index);
return 0;
}
if (match.length >= enc->fast_length) {
enc->opt_buf[0].prev_index = match.length;
enc->opt_buf[0].prev_dist = match.dist + kNumReps;
return 0;
}
{ unsigned cur_byte = *data;
unsigned match_byte = *(data - reps[0] - 1);
unsigned match_price;
unsigned normal_match_price;
unsigned rep_match_price;
size_t len;
size_t state = enc->states.state;
size_t pos_state = index & enc->pos_mask;
Probability is_match_prob = enc->states.is_match[state][pos_state];
Probability is_rep_prob = enc->states.is_rep[state];
enc->opt_buf[0].state = state;
/* Set the price for literal */
enc->opt_buf[1].price = GET_PRICE_0(rc, is_match_prob) +
GetLiteralPrice(enc, index, state, data[-1], cur_byte, match_byte);
MakeAsLiteral(enc->opt_buf[1]);
match_price = GET_PRICE_1(rc, is_match_prob);
rep_match_price = match_price + GET_PRICE_1(rc, is_rep_prob);
if (match_byte == cur_byte) {
/* Try 1-byte rep0 */
unsigned short_rep_price = rep_match_price + GetRepLen1Price(enc, state, pos_state);
if (short_rep_price < enc->opt_buf[1].price) {
enc->opt_buf[1].price = short_rep_price;
MakeAsShortRep(enc->opt_buf[1]);
}
}
memcpy(enc->opt_buf[0].reps, reps, sizeof(enc->opt_buf[0].reps));
enc->opt_buf[1].prev_index = 0;
/* Test the rep match prices */
for (size_t i = 0; i < kNumReps; ++i) {
unsigned price;
size_t rep_len = rep_lens[i];
if (rep_len < 2) {
continue;
}
price = rep_match_price + GetRepPrice(enc, i, state, pos_state);
/* Test every available length of the rep */
do {
unsigned cur_and_len_price = price + enc->states.rep_len_states.prices[pos_state][rep_len - kMatchLenMin];
if (cur_and_len_price < enc->opt_buf[rep_len].price) {
enc->opt_buf[rep_len].price = cur_and_len_price;
enc->opt_buf[rep_len].prev_index = 0;
enc->opt_buf[rep_len].prev_dist = (U32)(i);
enc->opt_buf[rep_len].is_combination = 0;
}
} while (--rep_len >= kMatchLenMin);
}
normal_match_price = match_price + GET_PRICE_0(rc, is_rep_prob);
len = (rep_lens[0] >= 2) ? rep_lens[0] + 1 : 2;
/* Test the match prices */
if (!is_hybrid) {
/* Normal mode */
InitMatchesPos0(enc, block, match, pos_state, len, normal_match_price);
return MAX(match.length, rep_lens[rep_max_index]);
}
else {
/* Hybrid mode */
size_t main_len = InitMatchesPos0Best(enc, block, match, index, len, normal_match_price);
return MAX(main_len, rep_lens[rep_max_index]);
}
}
}
FORCE_INLINE_TEMPLATE
size_t EncodeOptimumSequence(FL2_lzmaEncoderCtx* enc, const FL2_dataBlock block,
FL2_matchTable* tbl,
int const structTbl,
int const is_hybrid,
size_t start_index,
size_t uncompressed_end,
Match match)
{
size_t len_end = enc->len_end_max;
unsigned search_depth = tbl->params.depth;
do {
U32 reps[kNumReps];
size_t index;
size_t cur;
unsigned prev_index;
size_t i;
size_t const pos_mask = enc->pos_mask;
for (; (len_end & 3) != 0; --len_end) {
enc->opt_buf[len_end].price = kInfinityPrice;
}
for (; len_end >= 4; len_end -= 4) {
enc->opt_buf[len_end].price = kInfinityPrice;
enc->opt_buf[len_end - 1].price = kInfinityPrice;
enc->opt_buf[len_end - 2].price = kInfinityPrice;
enc->opt_buf[len_end - 3].price = kInfinityPrice;
}
index = start_index;
/* Set everything up at position 0 */
len_end = InitOptimizerPos0(enc, block, match, index, is_hybrid, reps);
match.length = 0;
cur = 1;
/* len_end == 0 if a match of fast_length was found */
if (len_end > 0) {
++index;
/* Lazy termination of the optimal parser. In the second half of the buffer */
/* a resolution within one byte is enough */
for (; cur < (len_end - cur / (kOptimizerBufferSize / 2U)); ++cur, ++index) {
if (enc->opt_buf[cur + 1].price < enc->opt_buf[cur].price)
continue;
match = FL2_radixGetMatch(block, tbl, search_depth, structTbl, index);
if (match.length >= enc->fast_length) {
break;
}
len_end = OptimalParse(enc, block, match, index, cur, len_end, is_hybrid, reps);
}
if (cur < len_end && match.length < enc->fast_length) {
/* Adjust the end point base on scaling up the price. */
cur += (enc->opt_buf[cur].price + enc->opt_buf[cur].price / cur) >= enc->opt_buf[cur + 1].price;
}
DEBUGLOG(6, "End optimal parse at %u", (U32)cur);
ReverseOptimalChain(enc->opt_buf, cur);
}
/* Encode the selections in the buffer */
prev_index = 0;
i = 0;
do {
unsigned len = enc->opt_buf[i].prev_index - prev_index;
prev_index = enc->opt_buf[i].prev_index;
if (len == 1 && enc->opt_buf[i].prev_dist == kNullDist)
{
EncodeLiteralBuf(enc, block.data, start_index + i);
}
else {
size_t match_index = start_index + i;
U32 dist = enc->opt_buf[i].prev_dist;
/* The last match will be truncated to fit in the optimal buffer so get the full length */
if (i + len >= kOptimizerBufferSize - 1 && dist >= kNumReps) {
Match lastmatch = FL2_radixGetMatch(block, tbl, search_depth, tbl->isStruct, match_index);
if (lastmatch.length > len) {
len = lastmatch.length;
dist = lastmatch.dist + kNumReps;
}
}
if (dist < kNumReps) {
EncodeRepMatch(enc, len, dist, match_index & pos_mask);
}
else {
EncodeNormalMatch(enc, len, dist - kNumReps, match_index & pos_mask);
}
}
i += len;
} while (i < cur);
start_index += i;
/* Do another round if there is a long match pending, because the reps must be checked */
/* and the match encoded. */
} while (match.length >= enc->fast_length && start_index < uncompressed_end && enc->rc.out_index < enc->rc.chunk_size);
enc->len_end_max = len_end;
return start_index;
}
static void UpdateLengthPrices(FL2_lzmaEncoderCtx* enc, LengthStates* len_states)
{
for (size_t pos_state = 0; pos_state <= enc->pos_mask; ++pos_state) {
LengthStates_SetPrices(&enc->rc, len_states, pos_state);
}
}
static void FillAlignPrices(FL2_lzmaEncoderCtx* enc)
{
for (size_t i = 0; i < kAlignTableSize; ++i) {
enc->align_prices[i] = GetReverseTreePrice(&enc->rc, enc->states.dist_align_encoders, kNumAlignBits, i);
}
enc->align_price_count = 0;
}
static void FillDistancesPrices(FL2_lzmaEncoderCtx* enc)
{
static const size_t kLastLenToPosState = kNumLenToPosStates - 1;
for (size_t i = kStartPosModelIndex; i < kNumFullDistances; ++i) {
size_t dist_slot = distance_table[i];
unsigned footerBits = (unsigned)((dist_slot >> 1) - 1);
size_t base = ((2 | (dist_slot & 1)) << footerBits);
enc->distance_prices[kLastLenToPosState][i] = GetReverseTreePrice(&enc->rc, enc->states.dist_encoders + base - dist_slot - 1,
footerBits,
i - base);
}
for (size_t lenToPosState = 0; lenToPosState < kNumLenToPosStates; ++lenToPosState) {
const Probability* encoder = enc->states.dist_slot_encoders[lenToPosState];
for (size_t dist_slot = 0; dist_slot < enc->dist_price_table_size; ++dist_slot) {
enc->dist_slot_prices[lenToPosState][dist_slot] = GetTreePrice(&enc->rc, encoder, kNumPosSlotBits, dist_slot);
}
for (size_t dist_slot = kEndPosModelIndex; dist_slot < enc->dist_price_table_size; ++dist_slot) {
enc->dist_slot_prices[lenToPosState][dist_slot] += (((unsigned)(dist_slot >> 1) - 1) - kNumAlignBits) << kNumBitPriceShiftBits;
}
size_t i = 0;
for (; i < kStartPosModelIndex; ++i) {
enc->distance_prices[lenToPosState][i] = enc->dist_slot_prices[lenToPosState][i];
}
for (; i < kNumFullDistances; ++i) {
enc->distance_prices[lenToPosState][i] = enc->dist_slot_prices[lenToPosState][distance_table[i]]
+ enc->distance_prices[kLastLenToPosState][i];
}
}
enc->match_price_count = 0;
}
FORCE_INLINE_TEMPLATE
size_t EncodeChunkBest(FL2_lzmaEncoderCtx* enc,
FL2_dataBlock const block,
FL2_matchTable* tbl,
int const structTbl,
size_t index,
size_t uncompressed_end)
{
unsigned search_depth = tbl->params.depth;
FillDistancesPrices(enc);
FillAlignPrices(enc);
UpdateLengthPrices(enc, &enc->states.len_states);
UpdateLengthPrices(enc, &enc->states.rep_len_states);
while (index < uncompressed_end && enc->rc.out_index < enc->rc.chunk_size)
{
Match match = FL2_radixGetMatch(block, tbl, search_depth, structTbl, index);
if (match.length > 1) {
if (enc->strategy != FL2_ultra) {
index = EncodeOptimumSequence(enc, block, tbl, structTbl, 0, index, uncompressed_end, match);
}
else {
index = EncodeOptimumSequence(enc, block, tbl, structTbl, 1, index, uncompressed_end, match);
}
if (enc->match_price_count >= kDistanceRepriceFrequency) {
FillDistancesPrices(enc);
}
if (enc->align_price_count >= kAlignRepriceFrequency) {
FillAlignPrices(enc);
}
}
else {
if (block.data[index] == block.data[index - enc->states.reps[0] - 1]) {
EncodeRepMatch(enc, 1, 0, index & enc->pos_mask);
}
else {
EncodeLiteralBuf(enc, block.data, index);
}
++index;
}
}
Flush(&enc->rc);
return index;
}
static void LengthStates_Reset(LengthStates* ls, unsigned fast_length)
{
ls->choice = kProbInitValue;
ls->choice_2 = kProbInitValue;
for (size_t i = 0; i < (kNumPositionStatesMax << kLenNumLowBits); ++i) {
ls->low[i] = kProbInitValue;
}
for (size_t i = 0; i < (kNumPositionStatesMax << kLenNumMidBits); ++i) {
ls->mid[i] = kProbInitValue;
}
for (size_t i = 0; i < kLenNumHighSymbols; ++i) {
ls->high[i] = kProbInitValue;
}
ls->table_size = fast_length + 1 - kMatchLenMin;
}
static void EncoderStates_Reset(EncoderStates* es, unsigned lc, unsigned lp, unsigned fast_length)
{
es->state = 0;
for (size_t i = 0; i < kNumReps; ++i) {
es->reps[i] = 0;
}
for (size_t i = 0; i < kNumStates; ++i) {
for (size_t j = 0; j < kNumPositionStatesMax; ++j) {
es->is_match[i][j] = kProbInitValue;
es->is_rep0_long[i][j] = kProbInitValue;
}
es->is_rep[i] = kProbInitValue;
es->is_rep_G0[i] = kProbInitValue;
es->is_rep_G1[i] = kProbInitValue;
es->is_rep_G2[i] = kProbInitValue;
}
size_t num = (size_t)(kNumLiterals * kNumLitTables) << (lp + lc);
for (size_t i = 0; i < num; ++i) {
es->literal_probs[i] = kProbInitValue;
}
for (size_t i = 0; i < kNumLenToPosStates; ++i) {
Probability *probs = es->dist_slot_encoders[i];
for (size_t j = 0; j < (1 << kNumPosSlotBits); ++j) {
probs[j] = kProbInitValue;
}
}
for (size_t i = 0; i < kNumFullDistances - kEndPosModelIndex; ++i) {
es->dist_encoders[i] = kProbInitValue;
}
LengthStates_Reset(&es->len_states, fast_length);
LengthStates_Reset(&es->rep_len_states, fast_length);
for (size_t i = 0; i < (1 << kNumAlignBits); ++i) {
es->dist_align_encoders[i] = kProbInitValue;
}
}
BYTE FL2_getDictSizeProp(size_t dictionary_size)
{
BYTE dict_size_prop = 0;
for (BYTE bit = 11; bit < 32; ++bit) {
if (((size_t)2 << bit) >= dictionary_size) {
dict_size_prop = (bit - 11) << 1;
break;
}
if (((size_t)3 << bit) >= dictionary_size) {
dict_size_prop = ((bit - 11) << 1) | 1;
break;
}
}
return dict_size_prop;
}
size_t FL2_lzma2MemoryUsage(unsigned chain_log, FL2_strategy strategy, unsigned thread_count)
{
size_t size = sizeof(FL2_lzmaEncoderCtx) + kChunkBufferSize;
if(strategy == FL2_ultra)
size += sizeof(HashChains) + (sizeof(U32) << chain_log) - sizeof(U32);
return size * thread_count;
}
static void Reset(FL2_lzmaEncoderCtx* enc, size_t max_distance)
{
DEBUGLOG(5, "LZMA encoder reset : max_distance %u", (unsigned)max_distance);
U32 i = 0;
RangeEncReset(&enc->rc);
EncoderStates_Reset(&enc->states, enc->lc, enc->lp, enc->fast_length);
enc->pos_mask = (1 << enc->pb) - 1;
enc->lit_pos_mask = (1 << enc->lp) - 1;
for (; max_distance > (size_t)1 << i; ++i) {
}
enc->dist_price_table_size = i * 2;
}
static BYTE GetLcLpPbCode(FL2_lzmaEncoderCtx* enc)
{
return (BYTE)((enc->pb * 5 + enc->lp) * 9 + enc->lc);
}
BYTE IsChunkRandom(const FL2_matchTable* const tbl,
const FL2_dataBlock block, size_t const start,
unsigned const strategy)
{
if (block.end - start >= kMinTestChunkSize) {
static const size_t max_dist_table[][5] = {
{ 0, 0, 0, 1U << 6, 1U << 14 }, /* fast */
{ 0, 0, 1U << 6, 1U << 14, 1U << 22 }, /* opt */
{ 0, 0, 1U << 6, 1U << 14, 1U << 22 } }; /* ultra */
static const size_t margin_divisor[3] = { 60U, 45U, 120U };
static const double dev_table[3] = { 6.0, 6.0, 5.0 };
size_t const end = MIN(start + kChunkSize, block.end);
size_t const chunk_size = end - start;
size_t count = 0;
size_t const margin = chunk_size / margin_divisor[strategy];
size_t const terminator = start + margin;
if (tbl->isStruct) {
size_t prev_dist = 0;
for (size_t index = start; index < end; ) {
U32 const link = GetMatchLink(tbl->table, index);
if (link == RADIX_NULL_LINK) {
++index;
++count;
prev_dist = 0;
}
else {
size_t length = GetMatchLength(tbl->table, index);
size_t dist = index - GetMatchLink(tbl->table, index);
if (length > 4)
count += dist != prev_dist;
else
count += (dist < max_dist_table[strategy][length]) ? 1 : length;
index += length;
prev_dist = dist;
}
if (count + terminator <= index)
return 0;
}
}
else {
size_t prev_dist = 0;
for (size_t index = start; index < end; ) {
U32 const link = tbl->table[index];
if (link == RADIX_NULL_LINK) {
++index;
++count;
prev_dist = 0;
}
else {
size_t length = link >> RADIX_LINK_BITS;
size_t dist = index - (link & RADIX_LINK_MASK);
if (length > 4)
count += dist != prev_dist;
else
count += (dist < max_dist_table[strategy][length]) ? 1 : length;
index += length;
prev_dist = dist;
}
if (count + terminator <= index)
return 0;
}
}
{ U32 char_count[256];
double char_total = 0.0;
/* Expected normal character count */
double const avg = (double)chunk_size / 256.0;
memset(char_count, 0, sizeof(char_count));
for (size_t index = start; index < end; ++index)
++char_count[block.data[index]];
/* Sum the deviations */
for (size_t i = 0; i < 256; ++i) {
double delta = (double)char_count[i] - avg;
char_total += delta * delta;
}
return sqrt(char_total) / sqrt((double)chunk_size) <= dev_table[strategy];
}
}
return 0;
}
#ifdef __GNUC__
#pragma GCC diagnostic ignored "-Wmaybe-uninitialized"
#else
__pragma(warning(disable:4701))
#endif
size_t FL2_lzma2Encode(FL2_lzmaEncoderCtx* enc,
FL2_matchTable* tbl,
const FL2_dataBlock block,
const FL2_lzma2Parameters* options,
FL2_progressFn progress, void* opaque, size_t base, U32 weight)
{
size_t const start = block.start;
BYTE* out_dest = enc->out_buf;
/* Each encoder writes a properties byte because the upstream encoder(s) could */
/* write only uncompressed chunks with no properties. */
BYTE encode_properties = 1;
BYTE next_is_random = 0;
if (block.end <= block.start) {
return 0;
}
enc->lc = options->lc;
enc->lp = options->lp;
if (enc->lc + enc->lp > 4) {
enc->lc = 3;
enc->lp = 0;
}
enc->pb = options->pb;
enc->strategy = options->strategy;
enc->fast_length = options->fast_length;
enc->match_cycles = options->match_cycles;
Reset(enc, block.end);
if (enc->strategy == FL2_ultra) {
/* Create a hash chain to put the encoder into hybrid mode */
if (enc->hash_alloc_3 < ((ptrdiff_t)1 << options->second_dict_bits)) {
if(HashCreate(enc, options->second_dict_bits) != 0)
return FL2_ERROR(memory_allocation);
}
else {
HashReset(enc, options->second_dict_bits);
}
enc->hash_prev_index = (start >= (size_t)enc->hash_dict_3) ? start - enc->hash_dict_3 : -1;
}
enc->len_end_max = kOptimizerBufferSize - 1;
RMF_limitLengths(tbl, block.end);
for (size_t index = start; index < block.end;)
{
unsigned header_size = encode_properties ? kChunkHeaderSize + 1 : kChunkHeaderSize;
EncoderStates saved_states;
size_t next_index;
size_t compressed_size;
size_t uncompressed_size;
RangeEncReset(&enc->rc);
SetOutputBuffer(&enc->rc, out_dest + header_size, kChunkSize);
if (!next_is_random) {
saved_states = enc->states;
if (index == 0) {
EncodeLiteral(enc, 0, block.data[0], 0);
}
if (enc->strategy == FL2_fast) {
if (tbl->isStruct) {
next_index = EncodeChunkFast(enc, block, tbl, 1,
index + (index == 0),
MIN(block.end, index + kMaxChunkUncompressedSize));
}
else {
next_index = EncodeChunkFast(enc, block, tbl, 0,
index + (index == 0),
MIN(block.end, index + kMaxChunkUncompressedSize));
}
}
else {
if (tbl->isStruct) {
next_index = EncodeChunkBest(enc, block, tbl, 1,
index + (index == 0),
MIN(block.end, index + kMaxChunkUncompressedSize - kOptimizerBufferSize));
}
else {
next_index = EncodeChunkBest(enc, block, tbl, 0,
index + (index == 0),
MIN(block.end, index + kMaxChunkUncompressedSize - kOptimizerBufferSize));
}
}
}
else {
next_index = MIN(index + kChunkSize, block.end);
}
compressed_size = enc->rc.out_index;
uncompressed_size = next_index - index;
out_dest[1] = (BYTE)((uncompressed_size - 1) >> 8);
out_dest[2] = (BYTE)(uncompressed_size - 1);
/* Output an uncompressed chunk if necessary */
if (next_is_random || uncompressed_size + 3 <= compressed_size + header_size) {
DEBUGLOG(5, "Storing chunk : was %u => %u", (unsigned)uncompressed_size, (unsigned)compressed_size);
if (index == 0) {
out_dest[0] = kChunkUncompressedDictReset;
}
else {
out_dest[0] = kChunkUncompressed;
}
memcpy(out_dest + 3, block.data + index, uncompressed_size);
compressed_size = uncompressed_size;
header_size = 3;
if (!next_is_random) {
enc->states = saved_states;
}
}
else {
DEBUGLOG(5, "Compressed chunk : %u => %u", (unsigned)uncompressed_size, (unsigned)compressed_size);
if (index == 0) {
out_dest[0] = kChunkCompressedFlag | kChunkAllReset;
}
else if (encode_properties) {
out_dest[0] = kChunkCompressedFlag | kChunkStatePropertiesReset;
}
else {
out_dest[0] = kChunkCompressedFlag | kChunkNothingReset;
}
out_dest[0] |= (BYTE)((uncompressed_size - 1) >> 16);
out_dest[3] = (BYTE)((compressed_size - 1) >> 8);
out_dest[4] = (BYTE)(compressed_size - 1);
if (encode_properties) {
out_dest[5] = GetLcLpPbCode(enc);
encode_properties = 0;
}
}
if (next_is_random || uncompressed_size + 3 <= compressed_size + (compressed_size >> kRandomFilterMarginBits) + header_size)
{
/* Test the next chunk for compressibility */
next_is_random = IsChunkRandom(tbl, block, next_index, enc->strategy);
}
if (index == start) {
/* After the first chunk we can write data to the match table because the */
/* compressed data will never catch up with the table position being read. */
out_dest = RMF_getTableAsOutputBuffer(tbl, start);
memcpy(out_dest, enc->out_buf, compressed_size + header_size);
}
out_dest += compressed_size + header_size;
index = next_index;
if (progress && progress(base + (((index - start) * weight) >> 4), opaque) != 0)
return FL2_ERROR(canceled);
}
return out_dest - RMF_getTableAsOutputBuffer(tbl, start);
}