1 | package brotli
|
---|
2 |
|
---|
3 | import (
|
---|
4 | "sync"
|
---|
5 | )
|
---|
6 |
|
---|
7 | /* Copyright 2014 Google Inc. All Rights Reserved.
|
---|
8 |
|
---|
9 | Distributed under MIT license.
|
---|
10 | See file LICENSE for detail or copy at https://opensource.org/licenses/MIT
|
---|
11 | */
|
---|
12 |
|
---|
13 | /* Algorithms for distributing the literals and commands of a metablock between
|
---|
14 | block types and contexts. */
|
---|
15 |
|
---|
16 | type metaBlockSplit struct {
|
---|
17 | literal_split blockSplit
|
---|
18 | command_split blockSplit
|
---|
19 | distance_split blockSplit
|
---|
20 | literal_context_map []uint32
|
---|
21 | literal_context_map_size uint
|
---|
22 | distance_context_map []uint32
|
---|
23 | distance_context_map_size uint
|
---|
24 | literal_histograms []histogramLiteral
|
---|
25 | literal_histograms_size uint
|
---|
26 | command_histograms []histogramCommand
|
---|
27 | command_histograms_size uint
|
---|
28 | distance_histograms []histogramDistance
|
---|
29 | distance_histograms_size uint
|
---|
30 | }
|
---|
31 |
|
---|
32 | var metaBlockPool sync.Pool
|
---|
33 |
|
---|
34 | func getMetaBlockSplit() *metaBlockSplit {
|
---|
35 | mb, _ := metaBlockPool.Get().(*metaBlockSplit)
|
---|
36 |
|
---|
37 | if mb == nil {
|
---|
38 | mb = &metaBlockSplit{}
|
---|
39 | } else {
|
---|
40 | initBlockSplit(&mb.literal_split)
|
---|
41 | initBlockSplit(&mb.command_split)
|
---|
42 | initBlockSplit(&mb.distance_split)
|
---|
43 | mb.literal_context_map = mb.literal_context_map[:0]
|
---|
44 | mb.literal_context_map_size = 0
|
---|
45 | mb.distance_context_map = mb.distance_context_map[:0]
|
---|
46 | mb.distance_context_map_size = 0
|
---|
47 | mb.literal_histograms = mb.literal_histograms[:0]
|
---|
48 | mb.command_histograms = mb.command_histograms[:0]
|
---|
49 | mb.distance_histograms = mb.distance_histograms[:0]
|
---|
50 | }
|
---|
51 | return mb
|
---|
52 | }
|
---|
53 |
|
---|
54 | func freeMetaBlockSplit(mb *metaBlockSplit) {
|
---|
55 | metaBlockPool.Put(mb)
|
---|
56 | }
|
---|
57 |
|
---|
58 | func initDistanceParams(params *encoderParams, npostfix uint32, ndirect uint32) {
|
---|
59 | var dist_params *distanceParams = ¶ms.dist
|
---|
60 | var alphabet_size uint32
|
---|
61 | var max_distance uint32
|
---|
62 |
|
---|
63 | dist_params.distance_postfix_bits = npostfix
|
---|
64 | dist_params.num_direct_distance_codes = ndirect
|
---|
65 |
|
---|
66 | alphabet_size = uint32(distanceAlphabetSize(uint(npostfix), uint(ndirect), maxDistanceBits))
|
---|
67 | max_distance = ndirect + (1 << (maxDistanceBits + npostfix + 2)) - (1 << (npostfix + 2))
|
---|
68 |
|
---|
69 | if params.large_window {
|
---|
70 | var bound = [maxNpostfix + 1]uint32{0, 4, 12, 28}
|
---|
71 | var postfix uint32 = 1 << npostfix
|
---|
72 | alphabet_size = uint32(distanceAlphabetSize(uint(npostfix), uint(ndirect), largeMaxDistanceBits))
|
---|
73 |
|
---|
74 | /* The maximum distance is set so that no distance symbol used can encode
|
---|
75 | a distance larger than BROTLI_MAX_ALLOWED_DISTANCE with all
|
---|
76 | its extra bits set. */
|
---|
77 | if ndirect < bound[npostfix] {
|
---|
78 | max_distance = maxAllowedDistance - (bound[npostfix] - ndirect)
|
---|
79 | } else if ndirect >= bound[npostfix]+postfix {
|
---|
80 | max_distance = (3 << 29) - 4 + (ndirect - bound[npostfix])
|
---|
81 | } else {
|
---|
82 | max_distance = maxAllowedDistance
|
---|
83 | }
|
---|
84 | }
|
---|
85 |
|
---|
86 | dist_params.alphabet_size = alphabet_size
|
---|
87 | dist_params.max_distance = uint(max_distance)
|
---|
88 | }
|
---|
89 |
|
---|
90 | func recomputeDistancePrefixes(cmds []command, orig_params *distanceParams, new_params *distanceParams) {
|
---|
91 | if orig_params.distance_postfix_bits == new_params.distance_postfix_bits && orig_params.num_direct_distance_codes == new_params.num_direct_distance_codes {
|
---|
92 | return
|
---|
93 | }
|
---|
94 |
|
---|
95 | for i := range cmds {
|
---|
96 | var cmd *command = &cmds[i]
|
---|
97 | if commandCopyLen(cmd) != 0 && cmd.cmd_prefix_ >= 128 {
|
---|
98 | prefixEncodeCopyDistance(uint(commandRestoreDistanceCode(cmd, orig_params)), uint(new_params.num_direct_distance_codes), uint(new_params.distance_postfix_bits), &cmd.dist_prefix_, &cmd.dist_extra_)
|
---|
99 | }
|
---|
100 | }
|
---|
101 | }
|
---|
102 |
|
---|
103 | func computeDistanceCost(cmds []command, orig_params *distanceParams, new_params *distanceParams, cost *float64) bool {
|
---|
104 | var equal_params bool = false
|
---|
105 | var dist_prefix uint16
|
---|
106 | var dist_extra uint32
|
---|
107 | var extra_bits float64 = 0.0
|
---|
108 | var histo histogramDistance
|
---|
109 | histogramClearDistance(&histo)
|
---|
110 |
|
---|
111 | if orig_params.distance_postfix_bits == new_params.distance_postfix_bits && orig_params.num_direct_distance_codes == new_params.num_direct_distance_codes {
|
---|
112 | equal_params = true
|
---|
113 | }
|
---|
114 |
|
---|
115 | for i := range cmds {
|
---|
116 | cmd := &cmds[i]
|
---|
117 | if commandCopyLen(cmd) != 0 && cmd.cmd_prefix_ >= 128 {
|
---|
118 | if equal_params {
|
---|
119 | dist_prefix = cmd.dist_prefix_
|
---|
120 | } else {
|
---|
121 | var distance uint32 = commandRestoreDistanceCode(cmd, orig_params)
|
---|
122 | if distance > uint32(new_params.max_distance) {
|
---|
123 | return false
|
---|
124 | }
|
---|
125 |
|
---|
126 | prefixEncodeCopyDistance(uint(distance), uint(new_params.num_direct_distance_codes), uint(new_params.distance_postfix_bits), &dist_prefix, &dist_extra)
|
---|
127 | }
|
---|
128 |
|
---|
129 | histogramAddDistance(&histo, uint(dist_prefix)&0x3FF)
|
---|
130 | extra_bits += float64(dist_prefix >> 10)
|
---|
131 | }
|
---|
132 | }
|
---|
133 |
|
---|
134 | *cost = populationCostDistance(&histo) + extra_bits
|
---|
135 | return true
|
---|
136 | }
|
---|
137 |
|
---|
138 | var buildMetaBlock_kMaxNumberOfHistograms uint = 256
|
---|
139 |
|
---|
140 | func buildMetaBlock(ringbuffer []byte, pos uint, mask uint, params *encoderParams, prev_byte byte, prev_byte2 byte, cmds []command, literal_context_mode int, mb *metaBlockSplit) {
|
---|
141 | var distance_histograms []histogramDistance
|
---|
142 | var literal_histograms []histogramLiteral
|
---|
143 | var literal_context_modes []int = nil
|
---|
144 | var literal_histograms_size uint
|
---|
145 | var distance_histograms_size uint
|
---|
146 | var i uint
|
---|
147 | var literal_context_multiplier uint = 1
|
---|
148 | var npostfix uint32
|
---|
149 | var ndirect_msb uint32 = 0
|
---|
150 | var check_orig bool = true
|
---|
151 | var best_dist_cost float64 = 1e99
|
---|
152 | var orig_params encoderParams = *params
|
---|
153 | /* Histogram ids need to fit in one byte. */
|
---|
154 |
|
---|
155 | var new_params encoderParams = *params
|
---|
156 |
|
---|
157 | for npostfix = 0; npostfix <= maxNpostfix; npostfix++ {
|
---|
158 | for ; ndirect_msb < 16; ndirect_msb++ {
|
---|
159 | var ndirect uint32 = ndirect_msb << npostfix
|
---|
160 | var skip bool
|
---|
161 | var dist_cost float64
|
---|
162 | initDistanceParams(&new_params, npostfix, ndirect)
|
---|
163 | if npostfix == orig_params.dist.distance_postfix_bits && ndirect == orig_params.dist.num_direct_distance_codes {
|
---|
164 | check_orig = false
|
---|
165 | }
|
---|
166 |
|
---|
167 | skip = !computeDistanceCost(cmds, &orig_params.dist, &new_params.dist, &dist_cost)
|
---|
168 | if skip || (dist_cost > best_dist_cost) {
|
---|
169 | break
|
---|
170 | }
|
---|
171 |
|
---|
172 | best_dist_cost = dist_cost
|
---|
173 | params.dist = new_params.dist
|
---|
174 | }
|
---|
175 |
|
---|
176 | if ndirect_msb > 0 {
|
---|
177 | ndirect_msb--
|
---|
178 | }
|
---|
179 | ndirect_msb /= 2
|
---|
180 | }
|
---|
181 |
|
---|
182 | if check_orig {
|
---|
183 | var dist_cost float64
|
---|
184 | computeDistanceCost(cmds, &orig_params.dist, &orig_params.dist, &dist_cost)
|
---|
185 | if dist_cost < best_dist_cost {
|
---|
186 | /* NB: currently unused; uncomment when more param tuning is added. */
|
---|
187 | /* best_dist_cost = dist_cost; */
|
---|
188 | params.dist = orig_params.dist
|
---|
189 | }
|
---|
190 | }
|
---|
191 |
|
---|
192 | recomputeDistancePrefixes(cmds, &orig_params.dist, ¶ms.dist)
|
---|
193 |
|
---|
194 | splitBlock(cmds, ringbuffer, pos, mask, params, &mb.literal_split, &mb.command_split, &mb.distance_split)
|
---|
195 |
|
---|
196 | if !params.disable_literal_context_modeling {
|
---|
197 | literal_context_multiplier = 1 << literalContextBits
|
---|
198 | literal_context_modes = make([]int, (mb.literal_split.num_types))
|
---|
199 | for i = 0; i < mb.literal_split.num_types; i++ {
|
---|
200 | literal_context_modes[i] = literal_context_mode
|
---|
201 | }
|
---|
202 | }
|
---|
203 |
|
---|
204 | literal_histograms_size = mb.literal_split.num_types * literal_context_multiplier
|
---|
205 | literal_histograms = make([]histogramLiteral, literal_histograms_size)
|
---|
206 | clearHistogramsLiteral(literal_histograms, literal_histograms_size)
|
---|
207 |
|
---|
208 | distance_histograms_size = mb.distance_split.num_types << distanceContextBits
|
---|
209 | distance_histograms = make([]histogramDistance, distance_histograms_size)
|
---|
210 | clearHistogramsDistance(distance_histograms, distance_histograms_size)
|
---|
211 |
|
---|
212 | mb.command_histograms_size = mb.command_split.num_types
|
---|
213 | if cap(mb.command_histograms) < int(mb.command_histograms_size) {
|
---|
214 | mb.command_histograms = make([]histogramCommand, (mb.command_histograms_size))
|
---|
215 | } else {
|
---|
216 | mb.command_histograms = mb.command_histograms[:mb.command_histograms_size]
|
---|
217 | }
|
---|
218 | clearHistogramsCommand(mb.command_histograms, mb.command_histograms_size)
|
---|
219 |
|
---|
220 | buildHistogramsWithContext(cmds, &mb.literal_split, &mb.command_split, &mb.distance_split, ringbuffer, pos, mask, prev_byte, prev_byte2, literal_context_modes, literal_histograms, mb.command_histograms, distance_histograms)
|
---|
221 | literal_context_modes = nil
|
---|
222 |
|
---|
223 | mb.literal_context_map_size = mb.literal_split.num_types << literalContextBits
|
---|
224 | if cap(mb.literal_context_map) < int(mb.literal_context_map_size) {
|
---|
225 | mb.literal_context_map = make([]uint32, (mb.literal_context_map_size))
|
---|
226 | } else {
|
---|
227 | mb.literal_context_map = mb.literal_context_map[:mb.literal_context_map_size]
|
---|
228 | }
|
---|
229 |
|
---|
230 | mb.literal_histograms_size = mb.literal_context_map_size
|
---|
231 | if cap(mb.literal_histograms) < int(mb.literal_histograms_size) {
|
---|
232 | mb.literal_histograms = make([]histogramLiteral, (mb.literal_histograms_size))
|
---|
233 | } else {
|
---|
234 | mb.literal_histograms = mb.literal_histograms[:mb.literal_histograms_size]
|
---|
235 | }
|
---|
236 |
|
---|
237 | clusterHistogramsLiteral(literal_histograms, literal_histograms_size, buildMetaBlock_kMaxNumberOfHistograms, mb.literal_histograms, &mb.literal_histograms_size, mb.literal_context_map)
|
---|
238 | literal_histograms = nil
|
---|
239 |
|
---|
240 | if params.disable_literal_context_modeling {
|
---|
241 | /* Distribute assignment to all contexts. */
|
---|
242 | for i = mb.literal_split.num_types; i != 0; {
|
---|
243 | var j uint = 0
|
---|
244 | i--
|
---|
245 | for ; j < 1<<literalContextBits; j++ {
|
---|
246 | mb.literal_context_map[(i<<literalContextBits)+j] = mb.literal_context_map[i]
|
---|
247 | }
|
---|
248 | }
|
---|
249 | }
|
---|
250 |
|
---|
251 | mb.distance_context_map_size = mb.distance_split.num_types << distanceContextBits
|
---|
252 | if cap(mb.distance_context_map) < int(mb.distance_context_map_size) {
|
---|
253 | mb.distance_context_map = make([]uint32, (mb.distance_context_map_size))
|
---|
254 | } else {
|
---|
255 | mb.distance_context_map = mb.distance_context_map[:mb.distance_context_map_size]
|
---|
256 | }
|
---|
257 |
|
---|
258 | mb.distance_histograms_size = mb.distance_context_map_size
|
---|
259 | if cap(mb.distance_histograms) < int(mb.distance_histograms_size) {
|
---|
260 | mb.distance_histograms = make([]histogramDistance, (mb.distance_histograms_size))
|
---|
261 | } else {
|
---|
262 | mb.distance_histograms = mb.distance_histograms[:mb.distance_histograms_size]
|
---|
263 | }
|
---|
264 |
|
---|
265 | clusterHistogramsDistance(distance_histograms, mb.distance_context_map_size, buildMetaBlock_kMaxNumberOfHistograms, mb.distance_histograms, &mb.distance_histograms_size, mb.distance_context_map)
|
---|
266 | distance_histograms = nil
|
---|
267 | }
|
---|
268 |
|
---|
269 | const maxStaticContexts = 13
|
---|
270 |
|
---|
271 | /* Greedy block splitter for one block category (literal, command or distance).
|
---|
272 | Gathers histograms for all context buckets. */
|
---|
273 | type contextBlockSplitter struct {
|
---|
274 | alphabet_size_ uint
|
---|
275 | num_contexts_ uint
|
---|
276 | max_block_types_ uint
|
---|
277 | min_block_size_ uint
|
---|
278 | split_threshold_ float64
|
---|
279 | num_blocks_ uint
|
---|
280 | split_ *blockSplit
|
---|
281 | histograms_ []histogramLiteral
|
---|
282 | histograms_size_ *uint
|
---|
283 | target_block_size_ uint
|
---|
284 | block_size_ uint
|
---|
285 | curr_histogram_ix_ uint
|
---|
286 | last_histogram_ix_ [2]uint
|
---|
287 | last_entropy_ [2 * maxStaticContexts]float64
|
---|
288 | merge_last_count_ uint
|
---|
289 | }
|
---|
290 |
|
---|
291 | func initContextBlockSplitter(self *contextBlockSplitter, alphabet_size uint, num_contexts uint, min_block_size uint, split_threshold float64, num_symbols uint, split *blockSplit, histograms *[]histogramLiteral, histograms_size *uint) {
|
---|
292 | var max_num_blocks uint = num_symbols/min_block_size + 1
|
---|
293 | var max_num_types uint
|
---|
294 | assert(num_contexts <= maxStaticContexts)
|
---|
295 |
|
---|
296 | self.alphabet_size_ = alphabet_size
|
---|
297 | self.num_contexts_ = num_contexts
|
---|
298 | self.max_block_types_ = maxNumberOfBlockTypes / num_contexts
|
---|
299 | self.min_block_size_ = min_block_size
|
---|
300 | self.split_threshold_ = split_threshold
|
---|
301 | self.num_blocks_ = 0
|
---|
302 | self.split_ = split
|
---|
303 | self.histograms_size_ = histograms_size
|
---|
304 | self.target_block_size_ = min_block_size
|
---|
305 | self.block_size_ = 0
|
---|
306 | self.curr_histogram_ix_ = 0
|
---|
307 | self.merge_last_count_ = 0
|
---|
308 |
|
---|
309 | /* We have to allocate one more histogram than the maximum number of block
|
---|
310 | types for the current histogram when the meta-block is too big. */
|
---|
311 | max_num_types = brotli_min_size_t(max_num_blocks, self.max_block_types_+1)
|
---|
312 |
|
---|
313 | brotli_ensure_capacity_uint8_t(&split.types, &split.types_alloc_size, max_num_blocks)
|
---|
314 | brotli_ensure_capacity_uint32_t(&split.lengths, &split.lengths_alloc_size, max_num_blocks)
|
---|
315 | split.num_blocks = max_num_blocks
|
---|
316 | *histograms_size = max_num_types * num_contexts
|
---|
317 | if histograms == nil || cap(*histograms) < int(*histograms_size) {
|
---|
318 | *histograms = make([]histogramLiteral, (*histograms_size))
|
---|
319 | } else {
|
---|
320 | *histograms = (*histograms)[:*histograms_size]
|
---|
321 | }
|
---|
322 | self.histograms_ = *histograms
|
---|
323 |
|
---|
324 | /* Clear only current histogram. */
|
---|
325 | clearHistogramsLiteral(self.histograms_[0:], num_contexts)
|
---|
326 |
|
---|
327 | self.last_histogram_ix_[1] = 0
|
---|
328 | self.last_histogram_ix_[0] = self.last_histogram_ix_[1]
|
---|
329 | }
|
---|
330 |
|
---|
331 | /* Does either of three things:
|
---|
332 | (1) emits the current block with a new block type;
|
---|
333 | (2) emits the current block with the type of the second last block;
|
---|
334 | (3) merges the current block with the last block. */
|
---|
335 | func contextBlockSplitterFinishBlock(self *contextBlockSplitter, is_final bool) {
|
---|
336 | var split *blockSplit = self.split_
|
---|
337 | var num_contexts uint = self.num_contexts_
|
---|
338 | var last_entropy []float64 = self.last_entropy_[:]
|
---|
339 | var histograms []histogramLiteral = self.histograms_
|
---|
340 |
|
---|
341 | if self.block_size_ < self.min_block_size_ {
|
---|
342 | self.block_size_ = self.min_block_size_
|
---|
343 | }
|
---|
344 |
|
---|
345 | if self.num_blocks_ == 0 {
|
---|
346 | var i uint
|
---|
347 |
|
---|
348 | /* Create first block. */
|
---|
349 | split.lengths[0] = uint32(self.block_size_)
|
---|
350 |
|
---|
351 | split.types[0] = 0
|
---|
352 |
|
---|
353 | for i = 0; i < num_contexts; i++ {
|
---|
354 | last_entropy[i] = bitsEntropy(histograms[i].data_[:], self.alphabet_size_)
|
---|
355 | last_entropy[num_contexts+i] = last_entropy[i]
|
---|
356 | }
|
---|
357 |
|
---|
358 | self.num_blocks_++
|
---|
359 | split.num_types++
|
---|
360 | self.curr_histogram_ix_ += num_contexts
|
---|
361 | if self.curr_histogram_ix_ < *self.histograms_size_ {
|
---|
362 | clearHistogramsLiteral(self.histograms_[self.curr_histogram_ix_:], self.num_contexts_)
|
---|
363 | }
|
---|
364 |
|
---|
365 | self.block_size_ = 0
|
---|
366 | } else if self.block_size_ > 0 {
|
---|
367 | var entropy [maxStaticContexts]float64
|
---|
368 | var combined_histo []histogramLiteral = make([]histogramLiteral, (2 * num_contexts))
|
---|
369 | var combined_entropy [2 * maxStaticContexts]float64
|
---|
370 | var diff = [2]float64{0.0}
|
---|
371 | /* Try merging the set of histograms for the current block type with the
|
---|
372 | respective set of histograms for the last and second last block types.
|
---|
373 | Decide over the split based on the total reduction of entropy across
|
---|
374 | all contexts. */
|
---|
375 |
|
---|
376 | var i uint
|
---|
377 | for i = 0; i < num_contexts; i++ {
|
---|
378 | var curr_histo_ix uint = self.curr_histogram_ix_ + i
|
---|
379 | var j uint
|
---|
380 | entropy[i] = bitsEntropy(histograms[curr_histo_ix].data_[:], self.alphabet_size_)
|
---|
381 | for j = 0; j < 2; j++ {
|
---|
382 | var jx uint = j*num_contexts + i
|
---|
383 | var last_histogram_ix uint = self.last_histogram_ix_[j] + i
|
---|
384 | combined_histo[jx] = histograms[curr_histo_ix]
|
---|
385 | histogramAddHistogramLiteral(&combined_histo[jx], &histograms[last_histogram_ix])
|
---|
386 | combined_entropy[jx] = bitsEntropy(combined_histo[jx].data_[0:], self.alphabet_size_)
|
---|
387 | diff[j] += combined_entropy[jx] - entropy[i] - last_entropy[jx]
|
---|
388 | }
|
---|
389 | }
|
---|
390 |
|
---|
391 | if split.num_types < self.max_block_types_ && diff[0] > self.split_threshold_ && diff[1] > self.split_threshold_ {
|
---|
392 | /* Create new block. */
|
---|
393 | split.lengths[self.num_blocks_] = uint32(self.block_size_)
|
---|
394 |
|
---|
395 | split.types[self.num_blocks_] = byte(split.num_types)
|
---|
396 | self.last_histogram_ix_[1] = self.last_histogram_ix_[0]
|
---|
397 | self.last_histogram_ix_[0] = split.num_types * num_contexts
|
---|
398 | for i = 0; i < num_contexts; i++ {
|
---|
399 | last_entropy[num_contexts+i] = last_entropy[i]
|
---|
400 | last_entropy[i] = entropy[i]
|
---|
401 | }
|
---|
402 |
|
---|
403 | self.num_blocks_++
|
---|
404 | split.num_types++
|
---|
405 | self.curr_histogram_ix_ += num_contexts
|
---|
406 | if self.curr_histogram_ix_ < *self.histograms_size_ {
|
---|
407 | clearHistogramsLiteral(self.histograms_[self.curr_histogram_ix_:], self.num_contexts_)
|
---|
408 | }
|
---|
409 |
|
---|
410 | self.block_size_ = 0
|
---|
411 | self.merge_last_count_ = 0
|
---|
412 | self.target_block_size_ = self.min_block_size_
|
---|
413 | } else if diff[1] < diff[0]-20.0 {
|
---|
414 | split.lengths[self.num_blocks_] = uint32(self.block_size_)
|
---|
415 | split.types[self.num_blocks_] = split.types[self.num_blocks_-2]
|
---|
416 | /* Combine this block with second last block. */
|
---|
417 |
|
---|
418 | var tmp uint = self.last_histogram_ix_[0]
|
---|
419 | self.last_histogram_ix_[0] = self.last_histogram_ix_[1]
|
---|
420 | self.last_histogram_ix_[1] = tmp
|
---|
421 | for i = 0; i < num_contexts; i++ {
|
---|
422 | histograms[self.last_histogram_ix_[0]+i] = combined_histo[num_contexts+i]
|
---|
423 | last_entropy[num_contexts+i] = last_entropy[i]
|
---|
424 | last_entropy[i] = combined_entropy[num_contexts+i]
|
---|
425 | histogramClearLiteral(&histograms[self.curr_histogram_ix_+i])
|
---|
426 | }
|
---|
427 |
|
---|
428 | self.num_blocks_++
|
---|
429 | self.block_size_ = 0
|
---|
430 | self.merge_last_count_ = 0
|
---|
431 | self.target_block_size_ = self.min_block_size_
|
---|
432 | } else {
|
---|
433 | /* Combine this block with last block. */
|
---|
434 | split.lengths[self.num_blocks_-1] += uint32(self.block_size_)
|
---|
435 |
|
---|
436 | for i = 0; i < num_contexts; i++ {
|
---|
437 | histograms[self.last_histogram_ix_[0]+i] = combined_histo[i]
|
---|
438 | last_entropy[i] = combined_entropy[i]
|
---|
439 | if split.num_types == 1 {
|
---|
440 | last_entropy[num_contexts+i] = last_entropy[i]
|
---|
441 | }
|
---|
442 |
|
---|
443 | histogramClearLiteral(&histograms[self.curr_histogram_ix_+i])
|
---|
444 | }
|
---|
445 |
|
---|
446 | self.block_size_ = 0
|
---|
447 | self.merge_last_count_++
|
---|
448 | if self.merge_last_count_ > 1 {
|
---|
449 | self.target_block_size_ += self.min_block_size_
|
---|
450 | }
|
---|
451 | }
|
---|
452 |
|
---|
453 | combined_histo = nil
|
---|
454 | }
|
---|
455 |
|
---|
456 | if is_final {
|
---|
457 | *self.histograms_size_ = split.num_types * num_contexts
|
---|
458 | split.num_blocks = self.num_blocks_
|
---|
459 | }
|
---|
460 | }
|
---|
461 |
|
---|
462 | /* Adds the next symbol to the current block type and context. When the
|
---|
463 | current block reaches the target size, decides on merging the block. */
|
---|
464 | func contextBlockSplitterAddSymbol(self *contextBlockSplitter, symbol uint, context uint) {
|
---|
465 | histogramAddLiteral(&self.histograms_[self.curr_histogram_ix_+context], symbol)
|
---|
466 | self.block_size_++
|
---|
467 | if self.block_size_ == self.target_block_size_ {
|
---|
468 | contextBlockSplitterFinishBlock(self, false) /* is_final = */
|
---|
469 | }
|
---|
470 | }
|
---|
471 |
|
---|
472 | func mapStaticContexts(num_contexts uint, static_context_map []uint32, mb *metaBlockSplit) {
|
---|
473 | var i uint
|
---|
474 | mb.literal_context_map_size = mb.literal_split.num_types << literalContextBits
|
---|
475 | if cap(mb.literal_context_map) < int(mb.literal_context_map_size) {
|
---|
476 | mb.literal_context_map = make([]uint32, (mb.literal_context_map_size))
|
---|
477 | } else {
|
---|
478 | mb.literal_context_map = mb.literal_context_map[:mb.literal_context_map_size]
|
---|
479 | }
|
---|
480 |
|
---|
481 | for i = 0; i < mb.literal_split.num_types; i++ {
|
---|
482 | var offset uint32 = uint32(i * num_contexts)
|
---|
483 | var j uint
|
---|
484 | for j = 0; j < 1<<literalContextBits; j++ {
|
---|
485 | mb.literal_context_map[(i<<literalContextBits)+j] = offset + static_context_map[j]
|
---|
486 | }
|
---|
487 | }
|
---|
488 | }
|
---|
489 |
|
---|
490 | func buildMetaBlockGreedyInternal(ringbuffer []byte, pos uint, mask uint, prev_byte byte, prev_byte2 byte, literal_context_lut contextLUT, num_contexts uint, static_context_map []uint32, commands []command, mb *metaBlockSplit) {
|
---|
491 | var lit_blocks struct {
|
---|
492 | plain blockSplitterLiteral
|
---|
493 | ctx contextBlockSplitter
|
---|
494 | }
|
---|
495 | var cmd_blocks blockSplitterCommand
|
---|
496 | var dist_blocks blockSplitterDistance
|
---|
497 | var num_literals uint = 0
|
---|
498 | for i := range commands {
|
---|
499 | num_literals += uint(commands[i].insert_len_)
|
---|
500 | }
|
---|
501 |
|
---|
502 | if num_contexts == 1 {
|
---|
503 | initBlockSplitterLiteral(&lit_blocks.plain, 256, 512, 400.0, num_literals, &mb.literal_split, &mb.literal_histograms, &mb.literal_histograms_size)
|
---|
504 | } else {
|
---|
505 | initContextBlockSplitter(&lit_blocks.ctx, 256, num_contexts, 512, 400.0, num_literals, &mb.literal_split, &mb.literal_histograms, &mb.literal_histograms_size)
|
---|
506 | }
|
---|
507 |
|
---|
508 | initBlockSplitterCommand(&cmd_blocks, numCommandSymbols, 1024, 500.0, uint(len(commands)), &mb.command_split, &mb.command_histograms, &mb.command_histograms_size)
|
---|
509 | initBlockSplitterDistance(&dist_blocks, 64, 512, 100.0, uint(len(commands)), &mb.distance_split, &mb.distance_histograms, &mb.distance_histograms_size)
|
---|
510 |
|
---|
511 | for _, cmd := range commands {
|
---|
512 | var j uint
|
---|
513 | blockSplitterAddSymbolCommand(&cmd_blocks, uint(cmd.cmd_prefix_))
|
---|
514 | for j = uint(cmd.insert_len_); j != 0; j-- {
|
---|
515 | var literal byte = ringbuffer[pos&mask]
|
---|
516 | if num_contexts == 1 {
|
---|
517 | blockSplitterAddSymbolLiteral(&lit_blocks.plain, uint(literal))
|
---|
518 | } else {
|
---|
519 | var context uint = uint(getContext(prev_byte, prev_byte2, literal_context_lut))
|
---|
520 | contextBlockSplitterAddSymbol(&lit_blocks.ctx, uint(literal), uint(static_context_map[context]))
|
---|
521 | }
|
---|
522 |
|
---|
523 | prev_byte2 = prev_byte
|
---|
524 | prev_byte = literal
|
---|
525 | pos++
|
---|
526 | }
|
---|
527 |
|
---|
528 | pos += uint(commandCopyLen(&cmd))
|
---|
529 | if commandCopyLen(&cmd) != 0 {
|
---|
530 | prev_byte2 = ringbuffer[(pos-2)&mask]
|
---|
531 | prev_byte = ringbuffer[(pos-1)&mask]
|
---|
532 | if cmd.cmd_prefix_ >= 128 {
|
---|
533 | blockSplitterAddSymbolDistance(&dist_blocks, uint(cmd.dist_prefix_)&0x3FF)
|
---|
534 | }
|
---|
535 | }
|
---|
536 | }
|
---|
537 |
|
---|
538 | if num_contexts == 1 {
|
---|
539 | blockSplitterFinishBlockLiteral(&lit_blocks.plain, true) /* is_final = */
|
---|
540 | } else {
|
---|
541 | contextBlockSplitterFinishBlock(&lit_blocks.ctx, true) /* is_final = */
|
---|
542 | }
|
---|
543 |
|
---|
544 | blockSplitterFinishBlockCommand(&cmd_blocks, true) /* is_final = */
|
---|
545 | blockSplitterFinishBlockDistance(&dist_blocks, true) /* is_final = */
|
---|
546 |
|
---|
547 | if num_contexts > 1 {
|
---|
548 | mapStaticContexts(num_contexts, static_context_map, mb)
|
---|
549 | }
|
---|
550 | }
|
---|
551 |
|
---|
552 | func buildMetaBlockGreedy(ringbuffer []byte, pos uint, mask uint, prev_byte byte, prev_byte2 byte, literal_context_lut contextLUT, num_contexts uint, static_context_map []uint32, commands []command, mb *metaBlockSplit) {
|
---|
553 | if num_contexts == 1 {
|
---|
554 | buildMetaBlockGreedyInternal(ringbuffer, pos, mask, prev_byte, prev_byte2, literal_context_lut, 1, nil, commands, mb)
|
---|
555 | } else {
|
---|
556 | buildMetaBlockGreedyInternal(ringbuffer, pos, mask, prev_byte, prev_byte2, literal_context_lut, num_contexts, static_context_map, commands, mb)
|
---|
557 | }
|
---|
558 | }
|
---|
559 |
|
---|
560 | func optimizeHistograms(num_distance_codes uint32, mb *metaBlockSplit) {
|
---|
561 | var good_for_rle [numCommandSymbols]byte
|
---|
562 | var i uint
|
---|
563 | for i = 0; i < mb.literal_histograms_size; i++ {
|
---|
564 | optimizeHuffmanCountsForRLE(256, mb.literal_histograms[i].data_[:], good_for_rle[:])
|
---|
565 | }
|
---|
566 |
|
---|
567 | for i = 0; i < mb.command_histograms_size; i++ {
|
---|
568 | optimizeHuffmanCountsForRLE(numCommandSymbols, mb.command_histograms[i].data_[:], good_for_rle[:])
|
---|
569 | }
|
---|
570 |
|
---|
571 | for i = 0; i < mb.distance_histograms_size; i++ {
|
---|
572 | optimizeHuffmanCountsForRLE(uint(num_distance_codes), mb.distance_histograms[i].data_[:], good_for_rle[:])
|
---|
573 | }
|
---|
574 | }
|
---|