| /* Copyright 2013 Google Inc. All Rights Reserved. | |
| Distributed under MIT license. | |
| See file LICENSE for detail or copy at https://opensource.org/licenses/MIT | |
| */ | |
| /* Function to find backward reference copies. */ | |
| #include "./backward_references.h" | |
| #include <math.h> /* INFINITY */ | |
| #include <string.h> /* memcpy, memset */ | |
| #include "../common/constants.h" | |
| #include "../common/types.h" | |
| #include "./command.h" | |
| #include "./fast_log.h" | |
| #include "./find_match_length.h" | |
| #include "./literal_cost.h" | |
| #include "./memory.h" | |
| #include "./port.h" | |
| #include "./prefix.h" | |
| #include "./quality.h" | |
| #if defined(__cplusplus) || defined(c_plusplus) | |
| extern "C" { | |
| #endif | |
/* Cost given to Zopfli nodes that have not been reached yet. Uses the
   <math.h> INFINITY macro when it is defined, otherwise a finite value close
   to the largest representable float. */
#if defined(INFINITY)
static const float kInfinity = INFINITY;
#else
static const float kInfinity = 3.4028e38f;
#endif
| void BrotliInitZopfliNodes(ZopfliNode* array, size_t length) { | |
| ZopfliNode stub; | |
| size_t i; | |
| stub.length = 1; | |
| stub.distance = 0; | |
| stub.insert_length = 0; | |
| stub.u.cost = kInfinity; | |
| for (i = 0; i < length; ++i) array[i] = stub; | |
| } | |
| static BROTLI_INLINE uint32_t ZopfliNodeCopyLength(const ZopfliNode* self) { | |
| return self->length & 0xffffff; | |
| } | |
| static BROTLI_INLINE uint32_t ZopfliNodeLengthCode(const ZopfliNode* self) { | |
| const uint32_t modifier = self->length >> 24; | |
| return ZopfliNodeCopyLength(self) + 9u - modifier; | |
| } | |
| static BROTLI_INLINE uint32_t ZopfliNodeCopyDistance(const ZopfliNode* self) { | |
| return self->distance & 0x1ffffff; | |
| } | |
| static BROTLI_INLINE uint32_t ZopfliNodeDistanceCode(const ZopfliNode* self) { | |
| const uint32_t short_code = self->distance >> 25; | |
| return short_code == 0 ? ZopfliNodeCopyDistance(self) + 15 : short_code - 1; | |
| } | |
| static BROTLI_INLINE uint32_t ZopfliNodeCommandLength(const ZopfliNode* self) { | |
| return ZopfliNodeCopyLength(self) + self->insert_length; | |
| } | |
| /* Histogram based cost model for zopflification. */ | |
| typedef struct ZopfliCostModel { | |
| /* The insert and copy length symbols. */ | |
| float cost_cmd_[BROTLI_NUM_COMMAND_SYMBOLS]; | |
| float cost_dist_[BROTLI_NUM_DISTANCE_SYMBOLS]; | |
| /* Cumulative costs of literals per position in the stream. */ | |
| float* literal_costs_; | |
| float min_cost_cmd_; | |
| size_t num_bytes_; | |
| } ZopfliCostModel; | |
| static void InitZopfliCostModel( | |
| MemoryManager* m, ZopfliCostModel* self, size_t num_bytes) { | |
| self->num_bytes_ = num_bytes; | |
| self->literal_costs_ = BROTLI_ALLOC(m, float, num_bytes + 2); | |
| if (BROTLI_IS_OOM(m)) return; | |
| } | |
| static void CleanupZopfliCostModel(MemoryManager* m, ZopfliCostModel* self) { | |
| BROTLI_FREE(m, self->literal_costs_); | |
| } | |
/* Converts |histogram| (|histogram_size| symbol counts) into per-symbol bit
   cost estimates written to |cost|. A symbol that occurs gets its Shannon cost
   log2(total) - log2(count), clamped to at least 1 bit; a symbol that never
   occurs gets log2(total) + 2. */
static void SetCost(const uint32_t* histogram, size_t histogram_size,
                    float* cost) {
  size_t total = 0;
  float log2total;
  size_t s;
  for (s = 0; s < histogram_size; ++s) {
    total += histogram[s];
  }
  log2total = (float)FastLog2(total);
  for (s = 0; s < histogram_size; ++s) {
    const uint32_t count = histogram[s];
    float bits;
    if (count == 0) {
      bits = log2total + 2;
    } else {
      /* Shannon bits for this symbol. */
      bits = log2total - (float)FastLog2(count);
      /* A symbol cannot be coded with less than 1 bit. */
      if (bits < 1) bits = 1;
    }
    cost[s] = bits;
  }
}
| static void ZopfliCostModelSetFromCommands(ZopfliCostModel* self, | |
| size_t position, | |
| const uint8_t* ringbuffer, | |
| size_t ringbuffer_mask, | |
| const Command* commands, | |
| size_t num_commands, | |
| size_t last_insert_len) { | |
| uint32_t histogram_literal[BROTLI_NUM_LITERAL_SYMBOLS]; | |
| uint32_t histogram_cmd[BROTLI_NUM_COMMAND_SYMBOLS]; | |
| uint32_t histogram_dist[BROTLI_NUM_DISTANCE_SYMBOLS]; | |
| float cost_literal[BROTLI_NUM_LITERAL_SYMBOLS]; | |
| size_t pos = position - last_insert_len; | |
| float min_cost_cmd = kInfinity; | |
| size_t i; | |
| float* cost_cmd = self->cost_cmd_; | |
| memset(histogram_literal, 0, sizeof(histogram_literal)); | |
| memset(histogram_cmd, 0, sizeof(histogram_cmd)); | |
| memset(histogram_dist, 0, sizeof(histogram_dist)); | |
| for (i = 0; i < num_commands; i++) { | |
| size_t inslength = commands[i].insert_len_; | |
| size_t copylength = CommandCopyLen(&commands[i]); | |
| size_t distcode = commands[i].dist_prefix_; | |
| size_t cmdcode = commands[i].cmd_prefix_; | |
| size_t j; | |
| histogram_cmd[cmdcode]++; | |
| if (cmdcode >= 128) histogram_dist[distcode]++; | |
| for (j = 0; j < inslength; j++) { | |
| histogram_literal[ringbuffer[(pos + j) & ringbuffer_mask]]++; | |
| } | |
| pos += inslength + copylength; | |
| } | |
| SetCost(histogram_literal, BROTLI_NUM_LITERAL_SYMBOLS, cost_literal); | |
| SetCost(histogram_cmd, BROTLI_NUM_COMMAND_SYMBOLS, cost_cmd); | |
| SetCost(histogram_dist, BROTLI_NUM_DISTANCE_SYMBOLS, self->cost_dist_); | |
| for (i = 0; i < BROTLI_NUM_COMMAND_SYMBOLS; ++i) { | |
| min_cost_cmd = BROTLI_MIN(float, min_cost_cmd, cost_cmd[i]); | |
| } | |
| self->min_cost_cmd_ = min_cost_cmd; | |
| { | |
| float* literal_costs = self->literal_costs_; | |
| size_t num_bytes = self->num_bytes_; | |
| literal_costs[0] = 0.0; | |
| for (i = 0; i < num_bytes; ++i) { | |
| literal_costs[i + 1] = literal_costs[i] + | |
| cost_literal[ringbuffer[(position + i) & ringbuffer_mask]]; | |
| } | |
| } | |
| } | |
| static void ZopfliCostModelSetFromLiteralCosts(ZopfliCostModel* self, | |
| size_t position, | |
| const uint8_t* ringbuffer, | |
| size_t ringbuffer_mask) { | |
| float* literal_costs = self->literal_costs_; | |
| float* cost_dist = self->cost_dist_; | |
| float* cost_cmd = self->cost_cmd_; | |
| size_t num_bytes = self->num_bytes_; | |
| size_t i; | |
| BrotliEstimateBitCostsForLiterals(position, num_bytes, ringbuffer_mask, | |
| ringbuffer, &literal_costs[1]); | |
| literal_costs[0] = 0.0; | |
| for (i = 0; i < num_bytes; ++i) { | |
| literal_costs[i + 1] += literal_costs[i]; | |
| } | |
| for (i = 0; i < BROTLI_NUM_COMMAND_SYMBOLS; ++i) { | |
| cost_cmd[i] = (float)FastLog2(11 + (uint32_t)i); | |
| } | |
| for (i = 0; i < BROTLI_NUM_DISTANCE_SYMBOLS; ++i) { | |
| cost_dist[i] = (float)FastLog2(20 + (uint32_t)i); | |
| } | |
| self->min_cost_cmd_ = (float)FastLog2(11); | |
| } | |
| static BROTLI_INLINE float ZopfliCostModelGetCommandCost( | |
| const ZopfliCostModel* self, uint16_t cmdcode) { | |
| return self->cost_cmd_[cmdcode]; | |
| } | |
| static BROTLI_INLINE float ZopfliCostModelGetDistanceCost( | |
| const ZopfliCostModel* self, size_t distcode) { | |
| return self->cost_dist_[distcode]; | |
| } | |
| static BROTLI_INLINE float ZopfliCostModelGetLiteralCosts( | |
| const ZopfliCostModel* self, size_t from, size_t to) { | |
| return self->literal_costs_[to] - self->literal_costs_[from]; | |
| } | |
| static BROTLI_INLINE float ZopfliCostModelGetMinCostCmd( | |
| const ZopfliCostModel* self) { | |
| return self->min_cost_cmd_; | |
| } | |
| static BROTLI_INLINE size_t ComputeDistanceCode(size_t distance, | |
| size_t max_distance, | |
| const int* dist_cache) { | |
| if (distance <= max_distance) { | |
| size_t distance_plus_3 = distance + 3; | |
| size_t offset0 = distance_plus_3 - (size_t)dist_cache[0]; | |
| size_t offset1 = distance_plus_3 - (size_t)dist_cache[1]; | |
| if (distance == (size_t)dist_cache[0]) { | |
| return 0; | |
| } else if (distance == (size_t)dist_cache[1]) { | |
| return 1; | |
| } else if (offset0 < 7) { | |
| return (0x9750468 >> (4 * offset0)) & 0xF; | |
| } else if (offset1 < 7) { | |
| return (0xFDB1ACE >> (4 * offset1)) & 0xF; | |
| } else if (distance == (size_t)dist_cache[2]) { | |
| return 2; | |
| } else if (distance == (size_t)dist_cache[3]) { | |
| return 3; | |
| } | |
| } | |
| return distance + 15; | |
| } | |
| /* REQUIRES: len >= 2, start_pos <= pos */ | |
| /* REQUIRES: cost < kInfinity, nodes[start_pos].cost < kInfinity */ | |
| /* Maintains the "ZopfliNode array invariant". */ | |
| static BROTLI_INLINE void UpdateZopfliNode(ZopfliNode* nodes, size_t pos, | |
| size_t start_pos, size_t len, size_t len_code, size_t dist, | |
| size_t short_code, float cost) { | |
| ZopfliNode* next = &nodes[pos + len]; | |
| next->length = (uint32_t)(len | ((len + 9u - len_code) << 24)); | |
| next->distance = (uint32_t)(dist | (short_code << 25)); | |
| next->insert_length = (uint32_t)(pos - start_pos); | |
| next->u.cost = cost; | |
| } | |
/* A candidate position at which the next command may start. */
typedef struct PosData {
  /* Block-relative position of the candidate. */
  size_t pos;
  /* Last four distances in effect at |pos|. */
  int distance_cache[4];
  /* |cost| minus the cost of coding everything before |pos| as literals. */
  float costdiff;
  /* Cost of the node at |pos|. */
  float cost;
} PosData;
| /* Maintains the smallest 8 cost difference together with their positions */ | |
| typedef struct StartPosQueue { | |
| PosData q_[8]; | |
| size_t idx_; | |
| } StartPosQueue; | |
| static BROTLI_INLINE void InitStartPosQueue(StartPosQueue* self) { | |
| self->idx_ = 0; | |
| } | |
| static size_t StartPosQueueSize(const StartPosQueue* self) { | |
| return BROTLI_MIN(size_t, self->idx_, 8); | |
| } | |
| static void StartPosQueuePush(StartPosQueue* self, const PosData* posdata) { | |
| size_t offset = ~(self->idx_++) & 7; | |
| size_t len = StartPosQueueSize(self); | |
| size_t i; | |
| PosData* q = self->q_; | |
| q[offset] = *posdata; | |
| /* Restore the sorted order. In the list of |len| items at most |len - 1| | |
| adjacent element comparisons / swaps are required. */ | |
| for (i = 1; i < len; ++i) { | |
| if (q[offset & 7].costdiff > q[(offset + 1) & 7].costdiff) { | |
| BROTLI_SWAP(PosData, q, offset & 7, (offset + 1) & 7); | |
| } | |
| ++offset; | |
| } | |
| } | |
| static const PosData* StartPosQueueAt(const StartPosQueue* self, size_t k) { | |
| return &self->q_[(k - self->idx_) & 7]; | |
| } | |
| /* Returns the minimum possible copy length that can improve the cost of any */ | |
| /* future position. */ | |
| static size_t ComputeMinimumCopyLength(const float start_cost, | |
| const ZopfliNode* nodes, | |
| const size_t num_bytes, | |
| const size_t pos) { | |
| /* Compute the minimum possible cost of reaching any future position. */ | |
| float min_cost = start_cost; | |
| size_t len = 2; | |
| size_t next_len_bucket = 4; | |
| size_t next_len_offset = 10; | |
| while (pos + len <= num_bytes && nodes[pos + len].u.cost <= min_cost) { | |
| /* We already reached (pos + len) with no more cost than the minimum | |
| possible cost of reaching anything from this pos, so there is no point in | |
| looking for lengths <= len. */ | |
| ++len; | |
| if (len == next_len_offset) { | |
| /* We reached the next copy length code bucket, so we add one more | |
| extra bit to the minimum cost. */ | |
| min_cost += 1.0f; | |
| next_len_offset += next_len_bucket; | |
| next_len_bucket *= 2; | |
| } | |
| } | |
| return len; | |
| } | |
| /* REQUIRES: nodes[pos].cost < kInfinity | |
| REQUIRES: nodes[0..pos] satisfies that "ZopfliNode array invariant". */ | |
| static uint32_t ComputeDistanceShortcut(const size_t block_start, | |
| const size_t pos, | |
| const size_t max_backward, | |
| const ZopfliNode* nodes) { | |
| const size_t clen = ZopfliNodeCopyLength(&nodes[pos]); | |
| const size_t ilen = nodes[pos].insert_length; | |
| const size_t dist = ZopfliNodeCopyDistance(&nodes[pos]); | |
| /* Since |block_start + pos| is the end position of the command, the copy part | |
| starts from |block_start + pos - clen|. Distances that are greater than | |
| this or greater than |max_backward| are static dictionary references, and | |
| do not update the last distances. Also distance code 0 (last distance) | |
| does not update the last distances. */ | |
| if (pos == 0) { | |
| return 0; | |
| } else if (dist + clen <= block_start + pos && | |
| dist <= max_backward && | |
| ZopfliNodeDistanceCode(&nodes[pos]) > 0) { | |
| return (uint32_t)pos; | |
| } else { | |
| return nodes[pos - clen - ilen].u.shortcut; | |
| } | |
| } | |
| /* Fills in dist_cache[0..3] with the last four distances (as defined by | |
| Section 4. of the Spec) that would be used at (block_start + pos) if we | |
| used the shortest path of commands from block_start, computed from | |
| nodes[0..pos]. The last four distances at block_start are in | |
| starting_dist_cach[0..3]. | |
| REQUIRES: nodes[pos].cost < kInfinity | |
| REQUIRES: nodes[0..pos] satisfies that "ZopfliNode array invariant". */ | |
| static void ComputeDistanceCache(const size_t pos, | |
| const int* starting_dist_cache, | |
| const ZopfliNode* nodes, | |
| int* dist_cache) { | |
| int idx = 0; | |
| size_t p = nodes[pos].u.shortcut; | |
| while (idx < 4 && p > 0) { | |
| const size_t ilen = nodes[p].insert_length; | |
| const size_t clen = ZopfliNodeCopyLength(&nodes[p]); | |
| const size_t dist = ZopfliNodeCopyDistance(&nodes[p]); | |
| dist_cache[idx++] = (int)dist; | |
| /* Because of prerequisite, p >= clen + ilen >= 2. */ | |
| p = nodes[p - clen - ilen].u.shortcut; | |
| } | |
| for (; idx < 4; ++idx) { | |
| dist_cache[idx] = *starting_dist_cache++; | |
| } | |
| } | |
/* Processes block-relative position |pos|: finalizes nodes[pos] and relaxes
   the nodes that can be reached by a command whose copy starts at |pos|.

   Steps, in order:
   1. The distance shortcut of nodes[pos] is computed and stored in its |u|
      member (the cost is read out first, see below).
   2. If the node cost does not exceed the cost of coding bytes [0, pos) as
      literals, |pos| is pushed into |queue| as a candidate command start,
      together with its cost difference and distance cache.
   3. A minimum useful copy length is derived from the cheapest queue entry.
   4. For up to MaxZopfliCandidates(params) queue entries, in order of
      increasing cost difference, copies from the last-distance candidates of
      that entry are tried; for the first two entries the |num_matches|
      entries of |matches| are tried as well. Every candidate that is cheaper
      than the current cost of nodes[pos + len] is recorded with
      UpdateZopfliNode.

   |num_bytes| is the block length (copies are limited to |num_bytes - pos|),
   |block_start| the position of the block in the ring buffer stream, and
   |starting_dist_cache| the last distances in effect at |block_start|. */
| static void UpdateNodes(const size_t num_bytes, | |
| const size_t block_start, | |
| const size_t pos, | |
| const uint8_t* ringbuffer, | |
| const size_t ringbuffer_mask, | |
| const BrotliEncoderParams* params, | |
| const size_t max_backward_limit, | |
| const int* starting_dist_cache, | |
| const size_t num_matches, | |
| const BackwardMatch* matches, | |
| const ZopfliCostModel* model, | |
| StartPosQueue* queue, | |
| ZopfliNode* nodes) { | |
| const size_t cur_ix = block_start + pos; | |
| const size_t cur_ix_masked = cur_ix & ringbuffer_mask; | |
| const size_t max_distance = BROTLI_MIN(size_t, cur_ix, max_backward_limit); | |
| const size_t max_len = num_bytes - pos; | |
| const size_t max_zopfli_len = MaxZopfliLen(params); | |
| const size_t max_iters = MaxZopfliCandidates(params); | |
| size_t min_len; | |
| size_t k; | |
| { | |
| /* Save the cost first: the shortcut stored right below goes into the same 'u' member of the node. NOTE(review): 'u' is presumably a union shared by cost and shortcut - confirm against the ZopfliNode declaration. */ | |
| float node_cost = nodes[pos].u.cost; | |
| nodes[pos].u.shortcut = ComputeDistanceShortcut( | |
| block_start, pos, max_backward_limit, nodes); | |
/* Only positions that are no more expensive than an all-literal prefix are
   kept as candidate command starts. */
| if (node_cost <= ZopfliCostModelGetLiteralCosts(model, 0, pos)) { | |
| PosData posdata; | |
| posdata.pos = pos; | |
| posdata.cost = node_cost; | |
| posdata.costdiff = node_cost - | |
| ZopfliCostModelGetLiteralCosts(model, 0, pos); | |
| ComputeDistanceCache( | |
| pos, starting_dist_cache, nodes, posdata.distance_cache); | |
| StartPosQueuePush(queue, &posdata); | |
| } | |
| } | |
| { | |
/* NOTE(review): slot 0 is read even when the queue is empty (for example when
   it was reset by the caller and the push above was skipped). In that case
   the candidate loop below does not run, so |min_len| is not used - confirm
   that reading the stale slot is acceptable. */
| const PosData* posdata = StartPosQueueAt(queue, 0); | |
| float min_cost = (posdata->cost + ZopfliCostModelGetMinCostCmd(model) + | |
| ZopfliCostModelGetLiteralCosts(model, posdata->pos, pos)); | |
| min_len = ComputeMinimumCopyLength(min_cost, nodes, num_bytes, pos); | |
| } | |
| /* Go over the command starting positions in order of increasing cost | |
| difference. */ | |
| for (k = 0; k < max_iters && k < StartPosQueueSize(queue); ++k) { | |
| const PosData* posdata = StartPosQueueAt(queue, k); | |
| const size_t start = posdata->pos; | |
| const uint16_t inscode = GetInsertLengthCode(pos - start); | |
| const float start_costdiff = posdata->costdiff; | |
| const float base_cost = start_costdiff + (float)GetInsertExtra(inscode) + | |
| ZopfliCostModelGetLiteralCosts(model, 0, pos); | |
| /* Look for last distance matches using the distance cache from this | |
| starting position. */ | |
| size_t best_len = min_len - 1; | |
| size_t j = 0; | |
| for (; j < BROTLI_NUM_DISTANCE_SHORT_CODES && best_len < max_len; ++j) { | |
| const size_t idx = kDistanceCacheIndex[j]; | |
| const size_t backward = | |
| (size_t)(posdata->distance_cache[idx] + kDistanceCacheOffset[j]); | |
| size_t prev_ix = cur_ix - backward; | |
/* Skip candidates whose source position would not lie before |cur_ix|
   (including unsigned wrap-around of the subtraction above). */
| if (prev_ix >= cur_ix) { | |
| continue; | |
| } | |
| if (PREDICT_FALSE(backward > max_distance)) { | |
| continue; | |
| } | |
| prev_ix &= ringbuffer_mask; | |
/* Quick rejection: the byte at offset |best_len| must be inside the ring
   buffer on both sides and must match, otherwise this candidate cannot be
   longer than the best length found so far. */
| if (cur_ix_masked + best_len > ringbuffer_mask || | |
| prev_ix + best_len > ringbuffer_mask || | |
| ringbuffer[cur_ix_masked + best_len] != | |
| ringbuffer[prev_ix + best_len]) { | |
| continue; | |
| } | |
| { | |
| const size_t len = | |
| FindMatchLengthWithLimit(&ringbuffer[prev_ix], | |
| &ringbuffer[cur_ix_masked], | |
| max_len); | |
| const float dist_cost = base_cost + | |
| ZopfliCostModelGetDistanceCost(model, j); | |
| size_t l; | |
| for (l = best_len + 1; l <= len; ++l) { | |
| const uint16_t copycode = GetCopyLengthCode(l); | |
| const uint16_t cmdcode = | |
| CombineLengthCodes(inscode, copycode, j == 0); | |
| const float cost = (cmdcode < 128 ? base_cost : dist_cost) + | |
| (float)GetCopyExtra(copycode) + | |
| ZopfliCostModelGetCommandCost(model, cmdcode); | |
| if (cost < nodes[pos + l].u.cost) { | |
| UpdateZopfliNode(nodes, pos, start, l, l, backward, j + 1, cost); | |
| } | |
| best_len = l; | |
| } | |
| } | |
| } | |
| /* At higher iterations look only for new last distance matches, since | |
| looking only for new command start positions with the same distances | |
| does not help much. */ | |
| if (k >= 2) continue; | |
| { | |
| /* Loop through all possible copy lengths at this position. */ | |
| size_t len = min_len; | |
| for (j = 0; j < num_matches; ++j) { | |
| BackwardMatch match = matches[j]; | |
| size_t dist = match.distance; | |
| BROTLI_BOOL is_dictionary_match = TO_BROTLI_BOOL(dist > max_distance); | |
| /* We already tried all possible last distance matches, so we can use | |
| normal distance code here. */ | |
| size_t dist_code = dist + 15; | |
| uint16_t dist_symbol; | |
| uint32_t distextra; | |
| uint32_t distnumextra; | |
| float dist_cost; | |
| size_t max_match_len; | |
| PrefixEncodeCopyDistance(dist_code, 0, 0, &dist_symbol, &distextra); | |
| distnumextra = distextra >> 24; | |
| dist_cost = base_cost + (float)distnumextra + | |
| ZopfliCostModelGetDistanceCost(model, dist_symbol); | |
| /* Try all copy lengths up until the maximum copy length corresponding | |
| to this distance. If the distance refers to the static dictionary, or | |
| the maximum length is long enough, try only one maximum length. */ | |
| max_match_len = BackwardMatchLength(&match); | |
| if (len < max_match_len && | |
| (is_dictionary_match || max_match_len > max_zopfli_len)) { | |
| len = max_match_len; | |
| } | |
| for (; len <= max_match_len; ++len) { | |
| const size_t len_code = | |
| is_dictionary_match ? BackwardMatchLengthCode(&match) : len; | |
| const uint16_t copycode = GetCopyLengthCode(len_code); | |
| const uint16_t cmdcode = CombineLengthCodes(inscode, copycode, 0); | |
| const float cost = dist_cost + (float)GetCopyExtra(copycode) + | |
| ZopfliCostModelGetCommandCost(model, cmdcode); | |
| if (cost < nodes[pos + len].u.cost) { | |
| UpdateZopfliNode(nodes, pos, start, len, len_code, dist, 0, cost); | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| static size_t ComputeShortestPathFromNodes(size_t num_bytes, | |
| ZopfliNode* nodes) { | |
| size_t index = num_bytes; | |
| size_t num_commands = 0; | |
| while (nodes[index].insert_length == 0 && nodes[index].length == 1) --index; | |
| nodes[index].u.next = BROTLI_UINT32_MAX; | |
| while (index != 0) { | |
| size_t len = ZopfliNodeCommandLength(&nodes[index]); | |
| index -= len; | |
| nodes[index].u.next = (uint32_t)len; | |
| num_commands++; | |
| } | |
| return num_commands; | |
| } | |
| void BrotliZopfliCreateCommands(const size_t num_bytes, | |
| const size_t block_start, | |
| const size_t max_backward_limit, | |
| const ZopfliNode* nodes, | |
| int* dist_cache, | |
| size_t* last_insert_len, | |
| Command* commands, | |
| size_t* num_literals) { | |
| size_t pos = 0; | |
| uint32_t offset = nodes[0].u.next; | |
| size_t i; | |
| for (i = 0; offset != BROTLI_UINT32_MAX; i++) { | |
| const ZopfliNode* next = &nodes[pos + offset]; | |
| size_t copy_length = ZopfliNodeCopyLength(next); | |
| size_t insert_length = next->insert_length; | |
| pos += insert_length; | |
| offset = next->u.next; | |
| if (i == 0) { | |
| insert_length += *last_insert_len; | |
| *last_insert_len = 0; | |
| } | |
| { | |
| size_t distance = ZopfliNodeCopyDistance(next); | |
| size_t len_code = ZopfliNodeLengthCode(next); | |
| size_t max_distance = | |
| BROTLI_MIN(size_t, block_start + pos, max_backward_limit); | |
| BROTLI_BOOL is_dictionary = TO_BROTLI_BOOL(distance > max_distance); | |
| size_t dist_code = ZopfliNodeDistanceCode(next); | |
| InitCommand( | |
| &commands[i], insert_length, copy_length, len_code, dist_code); | |
| if (!is_dictionary && dist_code > 0) { | |
| dist_cache[3] = dist_cache[2]; | |
| dist_cache[2] = dist_cache[1]; | |
| dist_cache[1] = dist_cache[0]; | |
| dist_cache[0] = (int)distance; | |
| } | |
| } | |
| *num_literals += insert_length; | |
| pos += copy_length; | |
| } | |
| *last_insert_len += num_bytes - pos; | |
| } | |
| static size_t ZopfliIterate(size_t num_bytes, | |
| size_t position, | |
| const uint8_t* ringbuffer, | |
| size_t ringbuffer_mask, | |
| const BrotliEncoderParams* params, | |
| const size_t max_backward_limit, | |
| const int* dist_cache, | |
| const ZopfliCostModel* model, | |
| const uint32_t* num_matches, | |
| const BackwardMatch* matches, | |
| ZopfliNode* nodes) { | |
| const size_t max_zopfli_len = MaxZopfliLen(params); | |
| StartPosQueue queue; | |
| size_t cur_match_pos = 0; | |
| size_t i; | |
| nodes[0].length = 0; | |
| nodes[0].u.cost = 0; | |
| InitStartPosQueue(&queue); | |
| for (i = 0; i + 3 < num_bytes; i++) { | |
| UpdateNodes(num_bytes, position, i, ringbuffer, ringbuffer_mask, | |
| params, max_backward_limit, dist_cache, num_matches[i], | |
| &matches[cur_match_pos], model, &queue, nodes); | |
| cur_match_pos += num_matches[i]; | |
| /* The zopflification can be too slow in case of very long lengths, so in | |
| such case skip it all, it does not cost a lot of compression ratio. */ | |
| if (num_matches[i] == 1 && | |
| BackwardMatchLength(&matches[cur_match_pos - 1]) > max_zopfli_len) { | |
| i += BackwardMatchLength(&matches[cur_match_pos - 1]) - 1; | |
| InitStartPosQueue(&queue); | |
| } | |
| } | |
| return ComputeShortestPathFromNodes(num_bytes, nodes); | |
| } | |
| size_t BrotliZopfliComputeShortestPath(MemoryManager* m, | |
| size_t num_bytes, | |
| size_t position, | |
| const uint8_t* ringbuffer, | |
| size_t ringbuffer_mask, | |
| const BrotliEncoderParams* params, | |
| const size_t max_backward_limit, | |
| const int* dist_cache, | |
| H10* hasher, | |
| ZopfliNode* nodes) { | |
| const size_t max_zopfli_len = MaxZopfliLen(params); | |
| ZopfliCostModel model; | |
| StartPosQueue queue; | |
| BackwardMatch matches[MAX_NUM_MATCHES_H10]; | |
| const size_t store_end = num_bytes >= StoreLookaheadH10() ? | |
| position + num_bytes - StoreLookaheadH10() + 1 : position; | |
| size_t i; | |
| nodes[0].length = 0; | |
| nodes[0].u.cost = 0; | |
| InitZopfliCostModel(m, &model, num_bytes); | |
| if (BROTLI_IS_OOM(m)) return 0; | |
| ZopfliCostModelSetFromLiteralCosts( | |
| &model, position, ringbuffer, ringbuffer_mask); | |
| InitStartPosQueue(&queue); | |
| for (i = 0; i + HashTypeLengthH10() - 1 < num_bytes; i++) { | |
| const size_t pos = position + i; | |
| const size_t max_distance = BROTLI_MIN(size_t, pos, max_backward_limit); | |
| size_t num_matches = FindAllMatchesH10(hasher, ringbuffer, ringbuffer_mask, | |
| pos, num_bytes - i, max_distance, params, matches); | |
| if (num_matches > 0 && | |
| BackwardMatchLength(&matches[num_matches - 1]) > max_zopfli_len) { | |
| matches[0] = matches[num_matches - 1]; | |
| num_matches = 1; | |
| } | |
| UpdateNodes(num_bytes, position, i, ringbuffer, ringbuffer_mask, | |
| params, max_backward_limit, dist_cache, num_matches, matches, | |
| &model, &queue, nodes); | |
| if (num_matches == 1 && BackwardMatchLength(&matches[0]) > max_zopfli_len) { | |
| /* Add the tail of the copy to the hasher. */ | |
| StoreRangeH10(hasher, ringbuffer, ringbuffer_mask, pos + 1, BROTLI_MIN( | |
| size_t, pos + BackwardMatchLength(&matches[0]), store_end)); | |
| i += BackwardMatchLength(&matches[0]) - 1; | |
| InitStartPosQueue(&queue); | |
| } | |
| } | |
| CleanupZopfliCostModel(m, &model); | |
| return ComputeShortestPathFromNodes(num_bytes, nodes); | |
| } | |
/* Per-hasher instantiation of the code in backward_references_inc.h.

   FN(X) pastes the name produced by HASHER() onto X (for example X followed
   by H2 while HASHER() expands to H2); the extra EXPAND_CAT level makes sure
   HASHER() is expanded before the token pasting happens. The include file is
   pulled in once for each of H2..H9 and H40..H42 with HASHER() redefined in
   between, and the helper macros are removed again afterwards.
   NOTE(review): the included file presumably defines the
   CreateBackwardReferencesH<N> functions called further down in this file -
   confirm in backward_references_inc.h. */
| #define EXPAND_CAT(a, b) CAT(a, b) | |
| #define CAT(a, b) a ## b | |
| #define FN(X) EXPAND_CAT(X, HASHER()) | |
| #define HASHER() H2 | |
| /* NOLINTNEXTLINE(build/include) */ | |
| #include "./backward_references_inc.h" | |
| #undef HASHER | |
| #define HASHER() H3 | |
| /* NOLINTNEXTLINE(build/include) */ | |
| #include "./backward_references_inc.h" | |
| #undef HASHER | |
| #define HASHER() H4 | |
| /* NOLINTNEXTLINE(build/include) */ | |
| #include "./backward_references_inc.h" | |
| #undef HASHER | |
| #define HASHER() H5 | |
| /* NOLINTNEXTLINE(build/include) */ | |
| #include "./backward_references_inc.h" | |
| #undef HASHER | |
| #define HASHER() H6 | |
| /* NOLINTNEXTLINE(build/include) */ | |
| #include "./backward_references_inc.h" | |
| #undef HASHER | |
| #define HASHER() H7 | |
| /* NOLINTNEXTLINE(build/include) */ | |
| #include "./backward_references_inc.h" | |
| #undef HASHER | |
| #define HASHER() H8 | |
| /* NOLINTNEXTLINE(build/include) */ | |
| #include "./backward_references_inc.h" | |
| #undef HASHER | |
| #define HASHER() H9 | |
| /* NOLINTNEXTLINE(build/include) */ | |
| #include "./backward_references_inc.h" | |
| #undef HASHER | |
| #define HASHER() H40 | |
| /* NOLINTNEXTLINE(build/include) */ | |
| #include "./backward_references_inc.h" | |
| #undef HASHER | |
| #define HASHER() H41 | |
| /* NOLINTNEXTLINE(build/include) */ | |
| #include "./backward_references_inc.h" | |
| #undef HASHER | |
| #define HASHER() H42 | |
| /* NOLINTNEXTLINE(build/include) */ | |
| #include "./backward_references_inc.h" | |
| #undef HASHER | |
| #undef FN | |
| #undef CAT | |
| #undef EXPAND_CAT | |
| static BROTLI_NOINLINE void CreateZopfliBackwardReferences( | |
| MemoryManager* m, size_t num_bytes, size_t position, BROTLI_BOOL is_last, | |
| const uint8_t* ringbuffer, size_t ringbuffer_mask, | |
| const BrotliEncoderParams* params, H10* hasher, int* dist_cache, | |
| size_t* last_insert_len, Command* commands, size_t* num_commands, | |
| size_t* num_literals) { | |
| const size_t max_backward_limit = MaxBackwardLimit(params->lgwin); | |
| ZopfliNode* nodes; | |
| InitH10(m, hasher, ringbuffer, params, position, num_bytes, is_last); | |
| if (BROTLI_IS_OOM(m)) return; | |
| StitchToPreviousBlockH10(hasher, num_bytes, position, | |
| ringbuffer, ringbuffer_mask); | |
| nodes = BROTLI_ALLOC(m, ZopfliNode, num_bytes + 1); | |
| if (BROTLI_IS_OOM(m)) return; | |
| BrotliInitZopfliNodes(nodes, num_bytes + 1); | |
| *num_commands += BrotliZopfliComputeShortestPath(m, num_bytes, position, | |
| ringbuffer, ringbuffer_mask, params, max_backward_limit, | |
| dist_cache, hasher, nodes); | |
| if (BROTLI_IS_OOM(m)) return; | |
| BrotliZopfliCreateCommands(num_bytes, position, max_backward_limit, nodes, | |
| dist_cache, last_insert_len, commands, num_literals); | |
| BROTLI_FREE(m, nodes); | |
| } | |
/* Creates the commands for the |num_bytes| bytes at |position| with two
   Zopfli passes over the same set of matches.

   Phase 1 collects, for every block position, the matches reported by
   FindAllMatchesH10 into the growable |matches| array; |num_matches[i]| is
   the number of matches kept for position |i|. When the longest match at a
   position exceeds MAX_ZOPFLI_LEN_QUALITY_11, only that match is kept, the
   rest of the copy is stored in the hasher and the positions it covers get
   zero matches and are skipped.

   Phase 2 runs ZopfliIterate + BrotliZopfliCreateCommands twice: first with a
   cost model built from literal costs, then with a cost model built from the
   commands produced by the first run. Before each run |*num_commands|,
   |*num_literals|, |*last_insert_len| and |dist_cache| are restored to the
   values they had on entry, so only the result of the second run remains.

   Returns early when |m| reports an out-of-memory condition. */
| static BROTLI_NOINLINE void CreateHqZopfliBackwardReferences( | |
| MemoryManager* m, size_t num_bytes, size_t position, BROTLI_BOOL is_last, | |
| const uint8_t* ringbuffer, size_t ringbuffer_mask, | |
| const BrotliEncoderParams* params, H10* hasher, int* dist_cache, | |
| size_t* last_insert_len, Command* commands, size_t* num_commands, | |
| size_t* num_literals) { | |
| const size_t max_backward_limit = MaxBackwardLimit(params->lgwin); | |
| uint32_t* num_matches = BROTLI_ALLOC(m, uint32_t, num_bytes); | |
| size_t matches_size = 4 * num_bytes; | |
| const size_t store_end = num_bytes >= StoreLookaheadH10() ? | |
| position + num_bytes - StoreLookaheadH10() + 1 : position; | |
| size_t cur_match_pos = 0; | |
| size_t i; | |
| size_t orig_num_literals; | |
| size_t orig_last_insert_len; | |
| int orig_dist_cache[4]; | |
| size_t orig_num_commands; | |
| ZopfliCostModel model; | |
| ZopfliNode* nodes; | |
| BackwardMatch* matches = BROTLI_ALLOC(m, BackwardMatch, matches_size); | |
/* A single check covers both allocations above. */
| if (BROTLI_IS_OOM(m)) return; | |
| InitH10(m, hasher, ringbuffer, params, position, num_bytes, is_last); | |
| if (BROTLI_IS_OOM(m)) return; | |
| StitchToPreviousBlockH10(hasher, num_bytes, position, | |
| ringbuffer, ringbuffer_mask); | |
/* Phase 1: collect the matches of every position. */
| for (i = 0; i + HashTypeLengthH10() - 1 < num_bytes; ++i) { | |
| const size_t pos = position + i; | |
| size_t max_distance = BROTLI_MIN(size_t, pos, max_backward_limit); | |
| size_t max_length = num_bytes - i; | |
| size_t num_found_matches; | |
| size_t cur_match_end; | |
| size_t j; | |
| /* Ensure that we have enough free slots. */ | |
| BROTLI_ENSURE_CAPACITY(m, BackwardMatch, matches, matches_size, | |
| cur_match_pos + MAX_NUM_MATCHES_H10); | |
| if (BROTLI_IS_OOM(m)) return; | |
| num_found_matches = FindAllMatchesH10(hasher, ringbuffer, ringbuffer_mask, | |
| pos, max_length, max_distance, params, &matches[cur_match_pos]); | |
| cur_match_end = cur_match_pos + num_found_matches; | |
/* Sanity checks: match lengths are strictly increasing, and distances are
   non-decreasing unless the earlier match lies beyond |max_distance|. */
| for (j = cur_match_pos; j + 1 < cur_match_end; ++j) { | |
| assert(BackwardMatchLength(&matches[j]) < | |
| BackwardMatchLength(&matches[j + 1])); | |
| assert(matches[j].distance > max_distance || | |
| matches[j].distance <= matches[j + 1].distance); | |
| } | |
| num_matches[i] = (uint32_t)num_found_matches; | |
| if (num_found_matches > 0) { | |
| const size_t match_len = BackwardMatchLength(&matches[cur_match_end - 1]); | |
| if (match_len > MAX_ZOPFLI_LEN_QUALITY_11) { | |
| const size_t skip = match_len - 1; | |
/* Keep only the longest match: it overwrites the first slot of this position
   and the other matches found here are dropped. */
| matches[cur_match_pos++] = matches[cur_match_end - 1]; | |
| num_matches[i] = 1; | |
| /* Add the tail of the copy to the hasher. */ | |
| StoreRangeH10(hasher, ringbuffer, ringbuffer_mask, pos + 1, | |
| BROTLI_MIN(size_t, pos + match_len, store_end)); | |
/* The positions covered by the copy get no matches and are skipped. */
| memset(&num_matches[i + 1], 0, skip * sizeof(num_matches[0])); | |
| i += skip; | |
| } else { | |
| cur_match_pos = cur_match_end; | |
| } | |
| } | |
| } | |
/* Remember the encoder state on entry so that each pass starts from it. */
| orig_num_literals = *num_literals; | |
| orig_last_insert_len = *last_insert_len; | |
| memcpy(orig_dist_cache, dist_cache, 4 * sizeof(dist_cache[0])); | |
| orig_num_commands = *num_commands; | |
| nodes = BROTLI_ALLOC(m, ZopfliNode, num_bytes + 1); | |
| if (BROTLI_IS_OOM(m)) return; | |
| InitZopfliCostModel(m, &model, num_bytes); | |
| if (BROTLI_IS_OOM(m)) return; | |
/* Phase 2: two passes; the second one uses the statistics of the commands
   created by the first one. */
| for (i = 0; i < 2; i++) { | |
| BrotliInitZopfliNodes(nodes, num_bytes + 1); | |
| if (i == 0) { | |
| ZopfliCostModelSetFromLiteralCosts( | |
| &model, position, ringbuffer, ringbuffer_mask); | |
| } else { | |
| ZopfliCostModelSetFromCommands(&model, position, ringbuffer, | |
| ringbuffer_mask, commands, *num_commands - orig_num_commands, | |
| orig_last_insert_len); | |
| } | |
| *num_commands = orig_num_commands; | |
| *num_literals = orig_num_literals; | |
| *last_insert_len = orig_last_insert_len; | |
| memcpy(dist_cache, orig_dist_cache, 4 * sizeof(dist_cache[0])); | |
| *num_commands += ZopfliIterate(num_bytes, position, ringbuffer, | |
| ringbuffer_mask, params, max_backward_limit, dist_cache, | |
| &model, num_matches, matches, nodes); | |
| BrotliZopfliCreateCommands(num_bytes, position, max_backward_limit, | |
| nodes, dist_cache, last_insert_len, commands, num_literals); | |
| } | |
| CleanupZopfliCostModel(m, &model); | |
| BROTLI_FREE(m, nodes); | |
| BROTLI_FREE(m, matches); | |
| BROTLI_FREE(m, num_matches); | |
| } | |
| void BrotliCreateBackwardReferences(MemoryManager* m, | |
| size_t num_bytes, | |
| size_t position, | |
| BROTLI_BOOL is_last, | |
| const uint8_t* ringbuffer, | |
| size_t ringbuffer_mask, | |
| const BrotliEncoderParams* params, | |
| Hashers* hashers, | |
| int* dist_cache, | |
| size_t* last_insert_len, | |
| Command* commands, | |
| size_t* num_commands, | |
| size_t* num_literals) { | |
| if (params->quality == ZOPFLIFICATION_QUALITY) { | |
| CreateZopfliBackwardReferences( | |
| m, num_bytes, position, is_last, ringbuffer, ringbuffer_mask, | |
| params, hashers->h10, dist_cache, | |
| last_insert_len, commands, num_commands, num_literals); | |
| return; | |
| } else if (params->quality == HQ_ZOPFLIFICATION_QUALITY) { | |
| CreateHqZopfliBackwardReferences( | |
| m, num_bytes, position, is_last, ringbuffer, ringbuffer_mask, | |
| params, hashers->h10, dist_cache, | |
| last_insert_len, commands, num_commands, num_literals); | |
| return; | |
| } | |
| switch (ChooseHasher(params)) { | |
| #define _CASE(N) \ | |
| case N: \ | |
| CreateBackwardReferencesH ## N(m, num_bytes, position, is_last, \ | |
| ringbuffer, ringbuffer_mask, params, hashers->h ## N, dist_cache, \ | |
| last_insert_len, commands, num_commands, num_literals); \ | |
| break; | |
| FOR_GENERIC_HASHERS(_CASE) | |
| #undef _CASE | |
| default: | |
| break; | |
| } | |
| if (BROTLI_IS_OOM(m)) return; | |
| } | |
| #if defined(__cplusplus) || defined(c_plusplus) | |
| } /* extern "C" */ | |
| #endif |