package brotli /* Copyright 2014 Google Inc. All Rights Reserved. Distributed under MIT license. See file LICENSE for detail or copy at https://opensource.org/licenses/MIT */ /* Algorithms for distributing the literals and commands of a metablock between block types and contexts. */ type metaBlockSplit struct { literal_split blockSplit command_split blockSplit distance_split blockSplit literal_context_map []uint32 literal_context_map_size uint distance_context_map []uint32 distance_context_map_size uint literal_histograms []histogramLiteral literal_histograms_size uint command_histograms []histogramCommand command_histograms_size uint distance_histograms []histogramDistance distance_histograms_size uint } func initMetaBlockSplit(mb *metaBlockSplit) { initBlockSplit(&mb.literal_split) initBlockSplit(&mb.command_split) initBlockSplit(&mb.distance_split) mb.literal_context_map = nil mb.literal_context_map_size = 0 mb.distance_context_map = nil mb.distance_context_map_size = 0 mb.literal_histograms = nil mb.literal_histograms_size = 0 mb.command_histograms = nil mb.command_histograms_size = 0 mb.distance_histograms = nil mb.distance_histograms_size = 0 } func destroyMetaBlockSplit(mb *metaBlockSplit) { destroyBlockSplit(&mb.literal_split) destroyBlockSplit(&mb.command_split) destroyBlockSplit(&mb.distance_split) mb.literal_context_map = nil mb.distance_context_map = nil mb.literal_histograms = nil mb.command_histograms = nil mb.distance_histograms = nil } func initDistanceParams(params *encoderParams, npostfix uint32, ndirect uint32) { var dist_params *distanceParams = ¶ms.dist var alphabet_size uint32 var max_distance uint32 dist_params.distance_postfix_bits = npostfix dist_params.num_direct_distance_codes = ndirect alphabet_size = uint32(distanceAlphabetSize(uint(npostfix), uint(ndirect), maxDistanceBits)) max_distance = ndirect + (1 << (maxDistanceBits + npostfix + 2)) - (1 << (npostfix + 2)) if params.large_window { var bound = [maxNpostfix + 1]uint32{0, 4, 12, 28} var postfix uint32 = 1 << npostfix alphabet_size = uint32(distanceAlphabetSize(uint(npostfix), uint(ndirect), largeMaxDistanceBits)) /* The maximum distance is set so that no distance symbol used can encode a distance larger than BROTLI_MAX_ALLOWED_DISTANCE with all its extra bits set. */ if ndirect < bound[npostfix] { max_distance = maxAllowedDistance - (bound[npostfix] - ndirect) } else if ndirect >= bound[npostfix]+postfix { max_distance = (3 << 29) - 4 + (ndirect - bound[npostfix]) } else { max_distance = maxAllowedDistance } } dist_params.alphabet_size = alphabet_size dist_params.max_distance = uint(max_distance) } func recomputeDistancePrefixes(cmds []command, num_commands uint, orig_params *distanceParams, new_params *distanceParams) { var i uint if orig_params.distance_postfix_bits == new_params.distance_postfix_bits && orig_params.num_direct_distance_codes == new_params.num_direct_distance_codes { return } for i = 0; i < num_commands; i++ { var cmd *command = &cmds[i] if commandCopyLen(cmd) != 0 && cmd.cmd_prefix_ >= 128 { prefixEncodeCopyDistance(uint(commandRestoreDistanceCode(cmd, orig_params)), uint(new_params.num_direct_distance_codes), uint(new_params.distance_postfix_bits), &cmd.dist_prefix_, &cmd.dist_extra_) } } } func computeDistanceCost(cmds []command, num_commands uint, orig_params *distanceParams, new_params *distanceParams, cost *float64) bool { var i uint var equal_params bool = false var dist_prefix uint16 var dist_extra uint32 var extra_bits float64 = 0.0 var histo histogramDistance histogramClearDistance(&histo) if orig_params.distance_postfix_bits == new_params.distance_postfix_bits && orig_params.num_direct_distance_codes == new_params.num_direct_distance_codes { equal_params = true } for i = 0; i < num_commands; i++ { var cmd *command = &cmds[i] if commandCopyLen(cmd) != 0 && cmd.cmd_prefix_ >= 128 { if equal_params { dist_prefix = cmd.dist_prefix_ } else { var distance uint32 = commandRestoreDistanceCode(cmd, orig_params) if distance > uint32(new_params.max_distance) { return false } prefixEncodeCopyDistance(uint(distance), uint(new_params.num_direct_distance_codes), uint(new_params.distance_postfix_bits), &dist_prefix, &dist_extra) } histogramAddDistance(&histo, uint(dist_prefix)&0x3FF) extra_bits += float64(dist_prefix >> 10) } } *cost = populationCostDistance(&histo) + extra_bits return true } var buildMetaBlock_kMaxNumberOfHistograms uint = 256 func buildMetaBlock(ringbuffer []byte, pos uint, mask uint, params *encoderParams, prev_byte byte, prev_byte2 byte, cmds []command, num_commands uint, literal_context_mode int, mb *metaBlockSplit) { var distance_histograms []histogramDistance var literal_histograms []histogramLiteral var literal_context_modes []int = nil var literal_histograms_size uint var distance_histograms_size uint var i uint var literal_context_multiplier uint = 1 var npostfix uint32 var ndirect_msb uint32 = 0 var check_orig bool = true var best_dist_cost float64 = 1e99 var orig_params encoderParams = *params /* Histogram ids need to fit in one byte. */ var new_params encoderParams = *params for npostfix = 0; npostfix <= maxNpostfix; npostfix++ { for ; ndirect_msb < 16; ndirect_msb++ { var ndirect uint32 = ndirect_msb << npostfix var skip bool var dist_cost float64 initDistanceParams(&new_params, npostfix, ndirect) if npostfix == orig_params.dist.distance_postfix_bits && ndirect == orig_params.dist.num_direct_distance_codes { check_orig = false } skip = !computeDistanceCost(cmds, num_commands, &orig_params.dist, &new_params.dist, &dist_cost) if skip || (dist_cost > best_dist_cost) { break } best_dist_cost = dist_cost params.dist = new_params.dist } if ndirect_msb > 0 { ndirect_msb-- } ndirect_msb /= 2 } if check_orig { var dist_cost float64 computeDistanceCost(cmds, num_commands, &orig_params.dist, &orig_params.dist, &dist_cost) if dist_cost < best_dist_cost { /* NB: currently unused; uncomment when more param tuning is added. */ /* best_dist_cost = dist_cost; */ params.dist = orig_params.dist } } recomputeDistancePrefixes(cmds, num_commands, &orig_params.dist, ¶ms.dist) splitBlock(cmds, num_commands, ringbuffer, pos, mask, params, &mb.literal_split, &mb.command_split, &mb.distance_split) if !params.disable_literal_context_modeling { literal_context_multiplier = 1 << literalContextBits literal_context_modes = make([]int, (mb.literal_split.num_types)) for i = 0; i < mb.literal_split.num_types; i++ { literal_context_modes[i] = literal_context_mode } } literal_histograms_size = mb.literal_split.num_types * literal_context_multiplier literal_histograms = make([]histogramLiteral, literal_histograms_size) clearHistogramsLiteral(literal_histograms, literal_histograms_size) distance_histograms_size = mb.distance_split.num_types << distanceContextBits distance_histograms = make([]histogramDistance, distance_histograms_size) clearHistogramsDistance(distance_histograms, distance_histograms_size) assert(mb.command_histograms == nil) mb.command_histograms_size = mb.command_split.num_types mb.command_histograms = make([]histogramCommand, (mb.command_histograms_size)) clearHistogramsCommand(mb.command_histograms, mb.command_histograms_size) buildHistogramsWithContext(cmds, num_commands, &mb.literal_split, &mb.command_split, &mb.distance_split, ringbuffer, pos, mask, prev_byte, prev_byte2, literal_context_modes, literal_histograms, mb.command_histograms, distance_histograms) literal_context_modes = nil assert(mb.literal_context_map == nil) mb.literal_context_map_size = mb.literal_split.num_types << literalContextBits mb.literal_context_map = make([]uint32, (mb.literal_context_map_size)) assert(mb.literal_histograms == nil) mb.literal_histograms_size = mb.literal_context_map_size mb.literal_histograms = make([]histogramLiteral, (mb.literal_histograms_size)) clusterHistogramsLiteral(literal_histograms, literal_histograms_size, buildMetaBlock_kMaxNumberOfHistograms, mb.literal_histograms, &mb.literal_histograms_size, mb.literal_context_map) literal_histograms = nil if params.disable_literal_context_modeling { /* Distribute assignment to all contexts. */ for i = mb.literal_split.num_types; i != 0; { var j uint = 0 i-- for ; j < 1< 0 { var entropy [maxStaticContexts]float64 var combined_histo []histogramLiteral = make([]histogramLiteral, (2 * num_contexts)) var combined_entropy [2 * maxStaticContexts]float64 var diff = [2]float64{0.0} /* Try merging the set of histograms for the current block type with the respective set of histograms for the last and second last block types. Decide over the split based on the total reduction of entropy across all contexts. */ var i uint for i = 0; i < num_contexts; i++ { var curr_histo_ix uint = self.curr_histogram_ix_ + i var j uint entropy[i] = bitsEntropy(histograms[curr_histo_ix].data_[:], self.alphabet_size_) for j = 0; j < 2; j++ { var jx uint = j*num_contexts + i var last_histogram_ix uint = self.last_histogram_ix_[j] + i combined_histo[jx] = histograms[curr_histo_ix] histogramAddHistogramLiteral(&combined_histo[jx], &histograms[last_histogram_ix]) combined_entropy[jx] = bitsEntropy(combined_histo[jx].data_[0:], self.alphabet_size_) diff[j] += combined_entropy[jx] - entropy[i] - last_entropy[jx] } } if split.num_types < self.max_block_types_ && diff[0] > self.split_threshold_ && diff[1] > self.split_threshold_ { /* Create new block. */ split.lengths[self.num_blocks_] = uint32(self.block_size_) split.types[self.num_blocks_] = byte(split.num_types) self.last_histogram_ix_[1] = self.last_histogram_ix_[0] self.last_histogram_ix_[0] = split.num_types * num_contexts for i = 0; i < num_contexts; i++ { last_entropy[num_contexts+i] = last_entropy[i] last_entropy[i] = entropy[i] } self.num_blocks_++ split.num_types++ self.curr_histogram_ix_ += num_contexts if self.curr_histogram_ix_ < *self.histograms_size_ { clearHistogramsLiteral(self.histograms_[self.curr_histogram_ix_:], self.num_contexts_) } self.block_size_ = 0 self.merge_last_count_ = 0 self.target_block_size_ = self.min_block_size_ } else if diff[1] < diff[0]-20.0 { split.lengths[self.num_blocks_] = uint32(self.block_size_) split.types[self.num_blocks_] = split.types[self.num_blocks_-2] /* Combine this block with second last block. */ var tmp uint = self.last_histogram_ix_[0] self.last_histogram_ix_[0] = self.last_histogram_ix_[1] self.last_histogram_ix_[1] = tmp for i = 0; i < num_contexts; i++ { histograms[self.last_histogram_ix_[0]+i] = combined_histo[num_contexts+i] last_entropy[num_contexts+i] = last_entropy[i] last_entropy[i] = combined_entropy[num_contexts+i] histogramClearLiteral(&histograms[self.curr_histogram_ix_+i]) } self.num_blocks_++ self.block_size_ = 0 self.merge_last_count_ = 0 self.target_block_size_ = self.min_block_size_ } else { /* Combine this block with last block. */ split.lengths[self.num_blocks_-1] += uint32(self.block_size_) for i = 0; i < num_contexts; i++ { histograms[self.last_histogram_ix_[0]+i] = combined_histo[i] last_entropy[i] = combined_entropy[i] if split.num_types == 1 { last_entropy[num_contexts+i] = last_entropy[i] } histogramClearLiteral(&histograms[self.curr_histogram_ix_+i]) } self.block_size_ = 0 self.merge_last_count_++ if self.merge_last_count_ > 1 { self.target_block_size_ += self.min_block_size_ } } combined_histo = nil } if is_final { *self.histograms_size_ = split.num_types * num_contexts split.num_blocks = self.num_blocks_ } } /* Adds the next symbol to the current block type and context. When the current block reaches the target size, decides on merging the block. */ func contextBlockSplitterAddSymbol(self *contextBlockSplitter, symbol uint, context uint) { histogramAddLiteral(&self.histograms_[self.curr_histogram_ix_+context], symbol) self.block_size_++ if self.block_size_ == self.target_block_size_ { contextBlockSplitterFinishBlock(self, false) /* is_final = */ } } func mapStaticContexts(num_contexts uint, static_context_map []uint32, mb *metaBlockSplit) { var i uint assert(mb.literal_context_map == nil) mb.literal_context_map_size = mb.literal_split.num_types << literalContextBits mb.literal_context_map = make([]uint32, (mb.literal_context_map_size)) for i = 0; i < mb.literal_split.num_types; i++ { var offset uint32 = uint32(i * num_contexts) var j uint for j = 0; j < 1<= 128 { blockSplitterAddSymbolDistance(&dist_blocks, uint(cmd.dist_prefix_)&0x3FF) } } } if num_contexts == 1 { blockSplitterFinishBlockLiteral(&lit_blocks.plain, true) /* is_final = */ } else { contextBlockSplitterFinishBlock(&lit_blocks.ctx, true) /* is_final = */ } blockSplitterFinishBlockCommand(&cmd_blocks, true) /* is_final = */ blockSplitterFinishBlockDistance(&dist_blocks, true) /* is_final = */ if num_contexts > 1 { mapStaticContexts(num_contexts, static_context_map, mb) } } func buildMetaBlockGreedy(ringbuffer []byte, pos uint, mask uint, prev_byte byte, prev_byte2 byte, literal_context_lut contextLUT, num_contexts uint, static_context_map []uint32, commands []command, n_commands uint, mb *metaBlockSplit) { if num_contexts == 1 { buildMetaBlockGreedyInternal(ringbuffer, pos, mask, prev_byte, prev_byte2, literal_context_lut, 1, nil, commands, n_commands, mb) } else { buildMetaBlockGreedyInternal(ringbuffer, pos, mask, prev_byte, prev_byte2, literal_context_lut, num_contexts, static_context_map, commands, n_commands, mb) } } func optimizeHistograms(num_distance_codes uint32, mb *metaBlockSplit) { var good_for_rle [numCommandSymbols]byte var i uint for i = 0; i < mb.literal_histograms_size; i++ { optimizeHuffmanCountsForRLE(256, mb.literal_histograms[i].data_[:], good_for_rle[:]) } for i = 0; i < mb.command_histograms_size; i++ { optimizeHuffmanCountsForRLE(numCommandSymbols, mb.command_histograms[i].data_[:], good_for_rle[:]) } for i = 0; i < mb.distance_histograms_size; i++ { optimizeHuffmanCountsForRLE(uint(num_distance_codes), mb.distance_histograms[i].data_[:], good_for_rle[:]) } }