2019-03-07 01:55:38 +03:00
|
|
|
package brotli
|
|
|
|
|
|
|
|
/* Copyright 2013 Google Inc. All Rights Reserved.

   Distributed under MIT license.
   See file LICENSE for detail or copy at https://opensource.org/licenses/MIT
*/
|
|
|
|
|
|
|
|
/* Block split point selection utilities. */
|
2019-03-22 01:34:30 +03:00
|
|
|
|
2019-03-15 22:05:31 +03:00
|
|
|
/* blockSplit is the per-stream block-split state. splitBlock hands one
   blockSplit to each of the splitByteVector* routines (literals,
   insert-and-copy commands, distances), and initBlockSplit resets one for
   reuse. */
type blockSplit struct {
	/* Counters; both are zeroed by initBlockSplit. Presumably the number of
	   distinct block types and the number of blocks - confirm against the
	   splitByteVector* implementations. */
	num_types  uint
	num_blocks uint

	/* Per-block storage. initBlockSplit truncates both slices to length
	   zero without releasing their backing arrays.
	   NOTE(review): presumably types[i] is the type id and lengths[i] the
	   symbol count of block i - confirm. */
	types   []byte
	lengths []uint32

	/* Bookkeeping sizes for the two slices above; zeroed by initBlockSplit. */
	types_alloc_size   uint
	lengths_alloc_size uint
}
|
|
|
|
|
2019-03-22 02:15:39 +03:00
|
|
|
/* Tuning parameters of the block splitter. */
const (
	/* Upper bounds on the number of histograms, passed by splitBlock to the
	   splitByteVector* routines. The command limit is also used for the
	   distance split. */
	kMaxLiteralHistograms uint = 100
	kMaxCommandHistograms uint = 50

	/* Block switch costs, one per symbol stream. */
	kLiteralBlockSwitchCost  float64 = 28.1
	kCommandBlockSwitchCost  float64 = 13.5
	kDistanceBlockSwitchCost float64 = 14.6

	/* Stride lengths. splitBlock uses the command stride for the distance
	   split as well. */
	kLiteralStrideLength uint = 70
	kCommandStrideLength uint = 40

	/* Symbols-per-histogram parameters, one per symbol stream. */
	kSymbolsPerLiteralHistogram  uint = 544
	kSymbolsPerCommandHistogram  uint = 530
	kSymbolsPerDistanceHistogram uint = 544

	/* The three constants below are not referenced in this part of the
	   file; judging by their names they are a minimum input length for
	   splitting and iteration controls for refinement - confirm at the use
	   sites. */
	kMinLengthForBlockSplitting uint = 128

	kIterMulForRefining  uint = 2
	kMinItersForRefining uint = 100
)
|
2019-03-07 01:55:38 +03:00
|
|
|
|
2020-05-09 02:48:16 +03:00
|
|
|
func countLiterals(cmds []command) uint {
|
2019-03-07 01:55:38 +03:00
|
|
|
var total_length uint = 0
|
|
|
|
/* Count how many we have. */
|
|
|
|
|
2020-05-09 02:48:16 +03:00
|
|
|
for i := range cmds {
|
2019-03-07 01:55:38 +03:00
|
|
|
total_length += uint(cmds[i].insert_len_)
|
|
|
|
}
|
|
|
|
|
|
|
|
return total_length
|
|
|
|
}
|
|
|
|
|
2020-05-09 02:48:16 +03:00
|
|
|
func copyLiteralsToByteArray(cmds []command, data []byte, offset uint, mask uint, literals []byte) {
|
2019-03-07 01:55:38 +03:00
|
|
|
var pos uint = 0
|
|
|
|
var from_pos uint = offset & mask
|
2020-05-09 02:48:16 +03:00
|
|
|
for i := range cmds {
|
2019-03-07 01:55:38 +03:00
|
|
|
var insert_len uint = uint(cmds[i].insert_len_)
|
|
|
|
if from_pos+insert_len > mask {
|
|
|
|
var head_size uint = mask + 1 - from_pos
|
|
|
|
copy(literals[pos:], data[from_pos:][:head_size])
|
|
|
|
from_pos = 0
|
|
|
|
pos += head_size
|
|
|
|
insert_len -= head_size
|
|
|
|
}
|
|
|
|
|
|
|
|
if insert_len > 0 {
|
|
|
|
copy(literals[pos:], data[from_pos:][:insert_len])
|
|
|
|
pos += insert_len
|
|
|
|
}
|
|
|
|
|
2019-03-15 22:05:31 +03:00
|
|
|
from_pos = uint((uint32(from_pos+insert_len) + commandCopyLen(&cmds[i])) & uint32(mask))
|
2019-03-07 01:55:38 +03:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-03-15 22:05:31 +03:00
|
|
|
/* myRand advances the pseudo-random state *seed and returns the new state.

   The state is multiplied by 16807 with uint32 wrap-around, i.e. modulo
   1 << 32. The updated value is stored back through seed, so successive
   calls with the same pointer walk the sequence.

   Initial seed should be 7. In this case, loop length is (1 << 29). */
func myRand(seed *uint32) uint32 {
	next := *seed * 16807
	*seed = next
	return next
}
|
|
|
|
|
2019-03-15 22:05:31 +03:00
|
|
|
func bitCost(count uint) float64 {
|
2019-03-07 01:55:38 +03:00
|
|
|
if count == 0 {
|
|
|
|
return -2.0
|
|
|
|
} else {
|
2019-03-16 03:24:40 +03:00
|
|
|
return fastLog2(count)
|
2019-03-07 01:55:38 +03:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2019-03-15 22:05:31 +03:00
|
|
|
/* Batch sizes. Neither constant is referenced in this part of the file;
   presumably they size the batches used when clustering histograms -
   confirm at the use sites. Both are untyped constants. */
const (
	histogramsPerBatch = 64
	clustersPerBatch   = 16
)
|
2019-03-07 01:55:38 +03:00
|
|
|
|
2019-03-15 22:05:31 +03:00
|
|
|
func initBlockSplit(self *blockSplit) {
|
2019-03-07 01:55:38 +03:00
|
|
|
self.num_types = 0
|
|
|
|
self.num_blocks = 0
|
2020-05-09 17:27:05 +03:00
|
|
|
self.types = self.types[:0]
|
|
|
|
self.lengths = self.lengths[:0]
|
2019-03-07 01:55:38 +03:00
|
|
|
self.types_alloc_size = 0
|
|
|
|
self.lengths_alloc_size = 0
|
|
|
|
}
|
|
|
|
|
2020-05-09 02:48:16 +03:00
|
|
|
func splitBlock(cmds []command, data []byte, pos uint, mask uint, params *encoderParams, literal_split *blockSplit, insert_and_copy_split *blockSplit, dist_split *blockSplit) {
|
2019-03-07 01:55:38 +03:00
|
|
|
{
|
2020-05-09 02:48:16 +03:00
|
|
|
var literals_count uint = countLiterals(cmds)
|
2019-03-07 01:55:38 +03:00
|
|
|
var literals []byte = make([]byte, literals_count)
|
|
|
|
|
|
|
|
/* Create a continuous array of literals. */
|
2020-05-09 02:48:16 +03:00
|
|
|
copyLiteralsToByteArray(cmds, data, pos, mask, literals)
|
2019-03-07 01:55:38 +03:00
|
|
|
|
|
|
|
/* Create the block split on the array of literals.
|
|
|
|
Literal histograms have alphabet size 256. */
|
2019-03-15 22:05:31 +03:00
|
|
|
splitByteVectorLiteral(literals, literals_count, kSymbolsPerLiteralHistogram, kMaxLiteralHistograms, kLiteralStrideLength, kLiteralBlockSwitchCost, params, literal_split)
|
2019-03-07 01:55:38 +03:00
|
|
|
|
|
|
|
literals = nil
|
|
|
|
}
|
|
|
|
{
|
2020-05-09 02:48:16 +03:00
|
|
|
var insert_and_copy_codes []uint16 = make([]uint16, len(cmds))
|
2019-03-07 01:55:38 +03:00
|
|
|
/* Compute prefix codes for commands. */
|
|
|
|
|
2020-05-09 02:48:16 +03:00
|
|
|
for i := range cmds {
|
2019-03-07 01:55:38 +03:00
|
|
|
insert_and_copy_codes[i] = cmds[i].cmd_prefix_
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Create the block split on the array of command prefixes. */
|
2020-05-09 02:48:16 +03:00
|
|
|
splitByteVectorCommand(insert_and_copy_codes, kSymbolsPerCommandHistogram, kMaxCommandHistograms, kCommandStrideLength, kCommandBlockSwitchCost, params, insert_and_copy_split)
|
2019-03-07 01:55:38 +03:00
|
|
|
|
|
|
|
/* TODO: reuse for distances? */
|
|
|
|
|
|
|
|
insert_and_copy_codes = nil
|
|
|
|
}
|
|
|
|
{
|
2020-05-09 02:48:16 +03:00
|
|
|
var distance_prefixes []uint16 = make([]uint16, len(cmds))
|
2019-03-07 01:55:38 +03:00
|
|
|
var j uint = 0
|
|
|
|
/* Create a continuous array of distance prefixes. */
|
|
|
|
|
2020-05-09 02:48:16 +03:00
|
|
|
for i := range cmds {
|
2019-03-15 22:05:31 +03:00
|
|
|
var cmd *command = &cmds[i]
|
|
|
|
if commandCopyLen(cmd) != 0 && cmd.cmd_prefix_ >= 128 {
|
2019-03-07 01:55:38 +03:00
|
|
|
distance_prefixes[j] = cmd.dist_prefix_ & 0x3FF
|
|
|
|
j++
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/* Create the block split on the array of distance prefixes. */
|
2019-03-15 22:05:31 +03:00
|
|
|
splitByteVectorDistance(distance_prefixes, j, kSymbolsPerDistanceHistogram, kMaxCommandHistograms, kCommandStrideLength, kDistanceBlockSwitchCost, params, dist_split)
|
2019-03-07 01:55:38 +03:00
|
|
|
|
|
|
|
distance_prefixes = nil
|
|
|
|
}
|
|
|
|
}
|