2017-04-10 11:59:45 -07:00
|
|
|
// Copyright 2017 The Prometheus Authors
|
|
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
// you may not use this file except in compliance with the License.
|
|
|
|
// You may obtain a copy of the License at
|
|
|
|
//
|
|
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
//
|
|
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
// See the License for the specific language governing permissions and
|
|
|
|
// limitations under the License.
|
|
|
|
|
2017-05-02 16:32:09 -07:00
|
|
|
// The code in this file was largely written by Damian Gryski as part of
|
|
|
|
// https://github.com/dgryski/go-tsz and published under the license below.
|
|
|
|
// It received minor modifications to suit Prometheus's needs.
|
|
|
|
|
|
|
|
// Copyright (c) 2015,2016 Damian Gryski <damian@gryski.com>
|
|
|
|
// All rights reserved.
|
|
|
|
|
|
|
|
// Redistribution and use in source and binary forms, with or without
|
|
|
|
// modification, are permitted provided that the following conditions are met:
|
|
|
|
|
|
|
|
// * Redistributions of source code must retain the above copyright notice,
|
|
|
|
// this list of conditions and the following disclaimer.
|
|
|
|
//
|
|
|
|
// * Redistributions in binary form must reproduce the above copyright notice,
|
|
|
|
// this list of conditions and the following disclaimer in the documentation
|
|
|
|
// and/or other materials provided with the distribution.
|
|
|
|
//
|
|
|
|
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND
|
|
|
|
// ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED
|
|
|
|
// WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
|
|
|
|
// DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE
|
|
|
|
// FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
|
|
|
|
// DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR
|
|
|
|
// SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
|
|
|
|
// CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
|
|
|
|
// OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
|
|
|
|
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
|
|
|
2017-11-30 06:34:49 -08:00
|
|
|
package chunkenc
|
2016-11-20 07:14:21 -08:00
|
|
|
|
2020-06-18 02:19:39 -07:00
|
|
|
import (
|
|
|
|
"encoding/binary"
|
|
|
|
"io"
|
|
|
|
)
|
2016-11-20 07:14:21 -08:00
|
|
|
|
2017-04-28 06:41:42 -07:00
|
|
|
// bstream is a stream of bits backed by a byte slice.
// Bits are appended to the last byte of the slice, and a new byte is
// appended whenever the current one has no free bits left.
type bstream struct {
	// stream holds the bytes written so far.
	stream []byte
	// count is the number of right-most bits still free for writing in the
	// current byte, i.e. the last byte of stream.
	count uint8
}
|
|
|
|
|
|
|
|
func (b *bstream) bytes() []byte {
|
|
|
|
return b.stream
|
|
|
|
}
|
|
|
|
|
|
|
|
// bit is a single binary digit, represented as a bool.
type bit bool

// The two values a bit can take.
const (
	zero = bit(false)
	one  = bit(true)
)
|
|
|
|
|
|
|
|
func (b *bstream) writeBit(bit bit) {
|
|
|
|
if b.count == 0 {
|
|
|
|
b.stream = append(b.stream, 0)
|
|
|
|
b.count = 8
|
|
|
|
}
|
|
|
|
|
|
|
|
i := len(b.stream) - 1
|
|
|
|
|
|
|
|
if bit {
|
|
|
|
b.stream[i] |= 1 << (b.count - 1)
|
|
|
|
}
|
|
|
|
|
|
|
|
b.count--
|
|
|
|
}
|
|
|
|
|
|
|
|
func (b *bstream) writeByte(byt byte) {
|
|
|
|
if b.count == 0 {
|
|
|
|
b.stream = append(b.stream, 0)
|
|
|
|
b.count = 8
|
|
|
|
}
|
|
|
|
|
|
|
|
i := len(b.stream) - 1
|
|
|
|
|
2021-10-25 06:14:15 -07:00
|
|
|
// Complete the last byte with the leftmost b.count bits from byt.
|
2016-11-20 07:14:21 -08:00
|
|
|
b.stream[i] |= byt >> (8 - b.count)
|
|
|
|
|
|
|
|
b.stream = append(b.stream, 0)
|
|
|
|
i++
|
2021-10-25 06:14:15 -07:00
|
|
|
// Write the remainder, if any.
|
2016-11-20 07:14:21 -08:00
|
|
|
b.stream[i] = byt << b.count
|
|
|
|
}
|
|
|
|
|
2021-10-25 06:14:15 -07:00
|
|
|
// writeBits writes the nbits right-most bits of u to the stream
|
|
|
|
// in left-to-right order.
|
2016-11-20 07:14:21 -08:00
|
|
|
func (b *bstream) writeBits(u uint64, nbits int) {
|
2021-07-29 05:56:57 -07:00
|
|
|
u <<= 64 - uint(nbits)
|
2016-11-20 07:14:21 -08:00
|
|
|
for nbits >= 8 {
|
|
|
|
byt := byte(u >> 56)
|
|
|
|
b.writeByte(byt)
|
|
|
|
u <<= 8
|
|
|
|
nbits -= 8
|
|
|
|
}
|
|
|
|
|
|
|
|
for nbits > 0 {
|
|
|
|
b.writeBit((u >> 63) == 1)
|
|
|
|
u <<= 1
|
|
|
|
nbits--
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-06-15 08:44:40 -07:00
|
|
|
// bstreamReader reads bits from a byte slice through a 64-bit buffer.
type bstreamReader struct {
	// stream is the byte slice being read.
	stream []byte
	// streamOffset is the offset from which to read the next byte of stream.
	streamOffset int

	// buffer is filled from the stream and holds up to 8 bytes to read bits from.
	buffer uint64
	// valid is the number of right-most bits of buffer that are still valid
	// to read; they are consumed from the left.
	valid uint8
	// last is a copy of the last byte of the stream.
	last byte
}
|
|
|
|
|
|
|
|
func newBReader(b []byte) bstreamReader {
|
2022-09-27 07:02:05 -07:00
|
|
|
// The last byte of the stream can be updated later, so we take a copy.
|
|
|
|
var last byte
|
|
|
|
if len(b) > 0 {
|
|
|
|
last = b[len(b)-1]
|
|
|
|
}
|
2020-06-15 08:44:40 -07:00
|
|
|
return bstreamReader{
|
|
|
|
stream: b,
|
2022-09-27 07:02:05 -07:00
|
|
|
last: last,
|
2020-06-15 08:44:40 -07:00
|
|
|
}
|
|
|
|
}
|
2016-11-30 12:50:39 -08:00
|
|
|
|
2020-06-15 08:44:40 -07:00
|
|
|
func (b *bstreamReader) readBit() (bit, error) {
|
|
|
|
if b.valid == 0 {
|
|
|
|
if !b.loadNextBuffer(1) {
|
2016-11-20 07:14:21 -08:00
|
|
|
return false, io.EOF
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-06-15 08:44:40 -07:00
|
|
|
return b.readBitFast()
|
2016-11-30 13:10:10 -08:00
|
|
|
}
|
|
|
|
|
2020-06-15 08:44:40 -07:00
|
|
|
// readBitFast is like readBit but can return io.EOF if the internal buffer is empty.
|
|
|
|
// If it returns io.EOF, the caller should retry reading bits calling readBit().
|
|
|
|
// This function must be kept small and a leaf in order to help the compiler inlining it
|
|
|
|
// and further improve performances.
|
|
|
|
func (b *bstreamReader) readBitFast() (bit, error) {
|
|
|
|
if b.valid == 0 {
|
|
|
|
return false, io.EOF
|
2016-11-20 07:14:21 -08:00
|
|
|
}
|
|
|
|
|
2020-06-15 08:44:40 -07:00
|
|
|
b.valid--
|
|
|
|
bitmask := uint64(1) << b.valid
|
|
|
|
return (b.buffer & bitmask) != 0, nil
|
|
|
|
}
|
2016-11-20 07:14:21 -08:00
|
|
|
|
2021-10-25 06:14:15 -07:00
|
|
|
// readBits constructs a uint64 with the nbits right-most bits
|
|
|
|
// read from the stream, and any other bits 0.
|
2020-06-15 08:44:40 -07:00
|
|
|
func (b *bstreamReader) readBits(nbits uint8) (uint64, error) {
|
|
|
|
if b.valid == 0 {
|
|
|
|
if !b.loadNextBuffer(nbits) {
|
2016-11-20 07:14:21 -08:00
|
|
|
return 0, io.EOF
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-06-15 08:44:40 -07:00
|
|
|
if nbits <= b.valid {
|
|
|
|
return b.readBitsFast(nbits)
|
2016-11-20 07:14:21 -08:00
|
|
|
}
|
|
|
|
|
2020-06-15 08:44:40 -07:00
|
|
|
// We have to read all remaining valid bits from the current buffer and a part from the next one.
|
|
|
|
bitmask := (uint64(1) << b.valid) - 1
|
|
|
|
nbits -= b.valid
|
|
|
|
v := (b.buffer & bitmask) << nbits
|
|
|
|
b.valid = 0
|
2016-11-20 07:14:21 -08:00
|
|
|
|
2020-06-15 08:44:40 -07:00
|
|
|
if !b.loadNextBuffer(nbits) {
|
2016-11-20 07:14:21 -08:00
|
|
|
return 0, io.EOF
|
|
|
|
}
|
|
|
|
|
2020-06-15 08:44:40 -07:00
|
|
|
bitmask = (uint64(1) << nbits) - 1
|
2023-04-09 00:08:40 -07:00
|
|
|
v |= ((b.buffer >> (b.valid - nbits)) & bitmask)
|
2020-06-15 08:44:40 -07:00
|
|
|
b.valid -= nbits
|
2016-11-20 07:14:21 -08:00
|
|
|
|
2020-06-15 08:44:40 -07:00
|
|
|
return v, nil
|
2016-11-20 07:14:21 -08:00
|
|
|
}
|
|
|
|
|
2020-06-15 08:44:40 -07:00
|
|
|
// readBitsFast is like readBits but can return io.EOF if the internal buffer is empty.
|
|
|
|
// If it returns io.EOF, the caller should retry reading bits calling readBits().
|
|
|
|
// This function must be kept small and a leaf in order to help the compiler inlining it
|
|
|
|
// and further improve performances.
|
|
|
|
func (b *bstreamReader) readBitsFast(nbits uint8) (uint64, error) {
|
|
|
|
if nbits > b.valid {
|
|
|
|
return 0, io.EOF
|
|
|
|
}
|
2016-11-20 07:14:21 -08:00
|
|
|
|
2020-06-15 08:44:40 -07:00
|
|
|
bitmask := (uint64(1) << nbits) - 1
|
|
|
|
b.valid -= nbits
|
2016-11-20 07:14:21 -08:00
|
|
|
|
2020-06-15 08:44:40 -07:00
|
|
|
return (b.buffer >> b.valid) & bitmask, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (b *bstreamReader) ReadByte() (byte, error) {
|
|
|
|
v, err := b.readBits(8)
|
|
|
|
if err != nil {
|
|
|
|
return 0, err
|
2016-11-20 07:14:21 -08:00
|
|
|
}
|
2020-06-15 08:44:40 -07:00
|
|
|
return byte(v), nil
|
|
|
|
}
|
2016-11-20 07:14:21 -08:00
|
|
|
|
2020-06-15 08:44:40 -07:00
|
|
|
// loadNextBuffer loads the next bytes from the stream into the internal buffer.
|
|
|
|
// The input nbits is the minimum number of bits that must be read, but the implementation
|
|
|
|
// can read more (if possible) to improve performances.
|
|
|
|
func (b *bstreamReader) loadNextBuffer(nbits uint8) bool {
|
|
|
|
if b.streamOffset >= len(b.stream) {
|
|
|
|
return false
|
2016-11-20 07:14:21 -08:00
|
|
|
}
|
|
|
|
|
2020-06-15 08:44:40 -07:00
|
|
|
// Handle the case there are more then 8 bytes in the buffer (most common case)
|
|
|
|
// in a optimized way. It's guaranteed that this branch will never read from the
|
|
|
|
// very last byte of the stream (which suffers race conditions due to concurrent
|
|
|
|
// writes).
|
|
|
|
if b.streamOffset+8 < len(b.stream) {
|
2020-06-18 02:19:39 -07:00
|
|
|
b.buffer = binary.BigEndian.Uint64(b.stream[b.streamOffset:])
|
2020-06-15 08:44:40 -07:00
|
|
|
b.streamOffset += 8
|
|
|
|
b.valid = 64
|
|
|
|
return true
|
|
|
|
}
|
2016-11-20 07:14:21 -08:00
|
|
|
|
2022-09-27 07:02:05 -07:00
|
|
|
// We're here if there are 8 or less bytes left in the stream.
|
|
|
|
// The following code is slower but called less frequently.
|
2020-06-15 08:44:40 -07:00
|
|
|
nbytes := int((nbits / 8) + 1)
|
|
|
|
if b.streamOffset+nbytes > len(b.stream) {
|
|
|
|
nbytes = len(b.stream) - b.streamOffset
|
|
|
|
}
|
|
|
|
|
|
|
|
buffer := uint64(0)
|
2022-09-27 07:02:05 -07:00
|
|
|
skip := 0
|
|
|
|
if b.streamOffset+nbytes == len(b.stream) {
|
|
|
|
// There can be concurrent writes happening on the very last byte
|
|
|
|
// of the stream, so use the copy we took at initialization time.
|
2023-04-09 00:08:40 -07:00
|
|
|
buffer |= uint64(b.last)
|
2022-09-27 07:02:05 -07:00
|
|
|
// Read up to the byte before
|
|
|
|
skip = 1
|
|
|
|
}
|
|
|
|
|
|
|
|
for i := 0; i < nbytes-skip; i++ {
|
2023-04-09 00:08:40 -07:00
|
|
|
buffer |= (uint64(b.stream[b.streamOffset+i]) << uint(8*(nbytes-i-1)))
|
2016-11-20 07:14:21 -08:00
|
|
|
}
|
|
|
|
|
2020-06-15 08:44:40 -07:00
|
|
|
b.buffer = buffer
|
|
|
|
b.streamOffset += nbytes
|
|
|
|
b.valid = uint8(nbytes * 8)
|
|
|
|
|
|
|
|
return true
|
2016-11-20 07:14:21 -08:00
|
|
|
}
|