Merge pull request #9509 from prometheus/beorn7/sparsehistogram

Histogram encoding improvements
2025-03-05 20:59:13 -08:00 · 2021-10-18 15:45:20 +02:00 · 2021-10-18 15:45:20 +02:00 · 8c1507ebaa
parent 7309c20e7e ad9b4c2b68
commit 8c1507ebaa
6 changed files with 373 additions and 122 deletions
--- a/tsdb/chunkenc/histogram.go
+++ b/tsdb/chunkenc/histogram.go
@ -153,10 +153,8 @@ func (c *HistogramChunk) Appender() (Appender, error) {
 		sum:      it.sum,
 		leading:  it.leading,
 		trailing: it.trailing,
 		buf64: make([]byte, binary.MaxVarintLen64),
 	}
-	if binary.BigEndian.Uint16(a.b.bytes()) == 0 {
+	if it.numTotal == 0 {
 		a.leading = 0xff
 	}
 	return a, nil
@ -222,20 +220,6 @@ type HistogramAppender struct {
 	sum      float64
 	leading  uint8
 	trailing uint8
 	buf64 []byte // For working on varint64's.
 }
 // putVarint encodes x as a signed varint into the scratch buffer buf and then
 // appends the encoded bytes, one at a time, to the bstream b. buf must be large
 // enough for binary.PutVarint (binary.MaxVarintLen64 bytes always suffices).
 func putVarint(b *bstream, buf []byte, x int64) {
 	n := binary.PutVarint(buf, x)
 	for i := 0; i < n; i++ {
 		b.writeByte(buf[i])
 	}
 }
 // putUvarint encodes x as an unsigned varint into the scratch buffer buf and
 // then appends the encoded bytes, one at a time, to the bstream b. buf must be
 // large enough for binary.PutUvarint (binary.MaxVarintLen64 bytes always
 // suffices).
 func putUvarint(b *bstream, buf []byte, x uint64) {
 	n := binary.PutUvarint(buf, x)
 	for i := 0; i < n; i++ {
 		b.writeByte(buf[i])
 	}
 }
 // Append implements Appender. This implementation panics because normal float
@ -418,18 +402,21 @@ func (a *HistogramAppender) AppendHistogram(t int64, h histogram.Histogram) {
 		a.nBucketsDelta = make([]int64, numNBuckets)
 		// Now store the actual data.
-		putVarint(a.b, a.buf64, t)
+		putVarbitInt(a.b, t)
-		putUvarint(a.b, a.buf64, h.Count)     // TODO(beorn7): Use putVarbitInt?
+		putVarbitUint(a.b, h.Count)
-		putUvarint(a.b, a.buf64, h.ZeroCount) // TODO(beorn7): Use putVarbitInt?
+		putVarbitUint(a.b, h.ZeroCount) //
 		a.b.writeBits(math.Float64bits(h.Sum), 64)
-		for _, buck := range h.PositiveBuckets {
+		for _, b := range h.PositiveBuckets {
-			putVarint(a.b, a.buf64, buck) // TODO(beorn7): Use putVarbitInt?
+			putVarbitInt(a.b, b)
 		}
-		for _, buck := range h.NegativeBuckets {
+		for _, b := range h.NegativeBuckets {
-			putVarint(a.b, a.buf64, buck) // TODO(beorn7): Use putVarbitInt?
+			putVarbitInt(a.b, b)
 		}
 	case 1:
 		tDelta = t - a.t
 		if tDelta < 0 {
 			panic("out of order timestamp")
 		}
 		cntDelta = int64(h.Count) - int64(a.cnt)
 		zCntDelta = int64(h.ZeroCount) - int64(a.zCnt)
@ -437,20 +424,20 @@ func (a *HistogramAppender) AppendHistogram(t int64, h histogram.Histogram) {
 			cntDelta, zCntDelta = 0, 0
 		}
-		putVarint(a.b, a.buf64, tDelta)    // TODO(beorn7): This should probably be putUvarint.
+		putVarbitUint(a.b, uint64(tDelta))
-		putVarint(a.b, a.buf64, cntDelta)  // TODO(beorn7): Use putVarbitInt?
+		putVarbitInt(a.b, cntDelta)
-		putVarint(a.b, a.buf64, zCntDelta) // TODO(beorn7): Use putVarbitInt?
+		putVarbitInt(a.b, zCntDelta)
 		a.writeSumDelta(h.Sum)
-		for i, buck := range h.PositiveBuckets {
+		for i, b := range h.PositiveBuckets {
-			delta := buck - a.pBuckets[i]
+			delta := b - a.pBuckets[i]
-			putVarint(a.b, a.buf64, delta) // TODO(beorn7): Use putVarbitInt?
+			putVarbitInt(a.b, delta)
 			a.pBucketsDelta[i] = delta
 		}
-		for i, buck := range h.NegativeBuckets {
+		for i, b := range h.NegativeBuckets {
-			delta := buck - a.nBuckets[i]
+			delta := b - a.nBuckets[i]
-			putVarint(a.b, a.buf64, delta) // TODO(beorn7): Use putVarbitInt?
+			putVarbitInt(a.b, delta)
 			a.nBucketsDelta[i] = delta
 		}
@ -721,21 +708,21 @@ func (it *histogramIterator) Next() bool {
 		}
 		// Now read the actual data.
-		t, err := binary.ReadVarint(&it.br)
+		t, err := readVarbitInt(&it.br)
 		if err != nil {
 			it.err = err
 			return false
 		}
 		it.t = t
-		cnt, err := binary.ReadUvarint(&it.br)
+		cnt, err := readVarbitUint(&it.br)
 		if err != nil {
 			it.err = err
 			return false
 		}
 		it.cnt = cnt
-		zcnt, err := binary.ReadUvarint(&it.br)
+		zcnt, err := readVarbitUint(&it.br)
 		if err != nil {
 			it.err = err
 			return false
@ -750,7 +737,7 @@ func (it *histogramIterator) Next() bool {
 		it.sum = math.Float64frombits(sum)
 		for i := range it.pBuckets {
-			v, err := binary.ReadVarint(&it.br)
+			v, err := readVarbitInt(&it.br)
 			if err != nil {
 				it.err = err
 				return false
@ -758,7 +745,7 @@ func (it *histogramIterator) Next() bool {
 			it.pBuckets[i] = v
 		}
 		for i := range it.nBuckets {
-			v, err := binary.ReadVarint(&it.br)
+			v, err := readVarbitInt(&it.br)
 			if err != nil {
 				it.err = err
 				return false
@ -771,15 +758,15 @@ func (it *histogramIterator) Next() bool {
 	}
 	if it.numRead == 1 {
-		tDelta, err := binary.ReadVarint(&it.br)
+		tDelta, err := readVarbitUint(&it.br)
 		if err != nil {
 			it.err = err
 			return false
 		}
-		it.tDelta = tDelta
+		it.tDelta = int64(tDelta)
-		it.t += int64(it.tDelta)
+		it.t += it.tDelta
-		cntDelta, err := binary.ReadVarint(&it.br)
+		cntDelta, err := readVarbitInt(&it.br)
 		if err != nil {
 			it.err = err
 			return false
@ -787,7 +774,7 @@ func (it *histogramIterator) Next() bool {
 		it.cntDelta = cntDelta
 		it.cnt = uint64(int64(it.cnt) + it.cntDelta)
-		zcntDelta, err := binary.ReadVarint(&it.br)
+		zcntDelta, err := readVarbitInt(&it.br)
 		if err != nil {
 			it.err = err
 			return false
@ -806,7 +793,7 @@ func (it *histogramIterator) Next() bool {
 		}
 		for i := range it.pBuckets {
-			delta, err := binary.ReadVarint(&it.br)
+			delta, err := readVarbitInt(&it.br)
 			if err != nil {
 				it.err = err
 				return false
@ -816,7 +803,7 @@ func (it *histogramIterator) Next() bool {
 		}
 		for i := range it.nBuckets {
-			delta, err := binary.ReadVarint(&it.br)
+			delta, err := readVarbitInt(&it.br)
 			if err != nil {
 				it.err = err
 				return false
--- a/tsdb/chunkenc/histogram_meta.go
+++ b/tsdb/chunkenc/histogram_meta.go
@ -14,40 +14,34 @@
 package chunkenc
 import (
 	"math"
 	"github.com/prometheus/prometheus/model/histogram"
 )
 // writeHistogramChunkLayout writes the layout header of a histogram chunk to
 // b. The fields are emitted in exactly this order, which is the order a reader
 // has to consume them in:
 //
 //   1. the zero threshold via putZeroThreshold,
 //   2. the schema as a signed varbit integer,
 //   3. the zero threshold again via putVarbitFloat,
 //   4. the positive spans,
 //   5. the negative spans.
 //
 // NOTE(review): the zero threshold is written twice, once in the compact
 // putZeroThreshold form and once via putVarbitFloat. This looks like the
 // previous encoding surviving next to its replacement - confirm against the
 // matching reader before removing either call, since both sides must agree.
 func writeHistogramChunkLayout(b *bstream, schema int32, zeroThreshold float64, positiveSpans, negativeSpans []histogram.Span) {
 	putZeroThreshold(b, zeroThreshold)
 	putVarbitInt(b, int64(schema))
 	putVarbitFloat(b, zeroThreshold)
 	putHistogramChunkLayoutSpans(b, positiveSpans)
 	putHistogramChunkLayoutSpans(b, negativeSpans)
 }
 // putHistogramChunkLayoutSpans writes the number of spans to b, followed by the
 // length and the offset of each span in slice order. All three kinds of values
 // are written with putVarbitInt, i.e. as signed varbit integers.
 func putHistogramChunkLayoutSpans(b *bstream, spans []histogram.Span) {
 	count := len(spans)
 	putVarbitInt(b, int64(count))
 	for i := 0; i < count; i++ {
 		span := spans[i]
 		putVarbitInt(b, int64(span.Length))
 		putVarbitInt(b, int64(span.Offset))
 	}
 }
 func readHistogramChunkLayout(b *bstreamReader) (
 	schema int32, zeroThreshold float64,
 	positiveSpans, negativeSpans []histogram.Span,
 	err error,
 ) {
 	zeroThreshold, err = readZeroThreshold(b)
 	if err != nil {
 		return
 	}
 	v, err := readVarbitInt(b)
 	if err != nil {
 		return
 	}
 	schema = int32(v)
 	zeroThreshold, err = readVarbitFloat(b)
 	if err != nil {
 		return
 	}
 	positiveSpans, err = readHistogramChunkLayoutSpans(b)
 	if err != nil {
 		return
@ -61,15 +55,23 @@ func readHistogramChunkLayout(b *bstreamReader) (
 	return
 }
 // putHistogramChunkLayoutSpans writes the number of spans to b, followed by the
 // length and the offset of each span in slice order. The span count and each
 // length are written with putVarbitUint; each offset is written with
 // putVarbitInt.
 func putHistogramChunkLayoutSpans(b *bstream, spans []histogram.Span) {
 	count := len(spans)
 	putVarbitUint(b, uint64(count))
 	for i := 0; i < count; i++ {
 		span := spans[i]
 		putVarbitUint(b, uint64(span.Length))
 		putVarbitInt(b, int64(span.Offset))
 	}
 }
 func readHistogramChunkLayoutSpans(b *bstreamReader) ([]histogram.Span, error) {
 	var spans []histogram.Span
-	num, err := readVarbitInt(b)
+	num, err := readVarbitUint(b)
 	if err != nil {
 		return nil, err
 	}
 	for i := 0; i < int(num); i++ {
-		length, err := readVarbitInt(b)
+		length, err := readVarbitUint(b)
 		if err != nil {
 			return nil, err
 		}
@ -87,6 +89,57 @@ func readHistogramChunkLayoutSpans(b *bstreamReader) ([]histogram.Span, error) {
 	return spans, nil
 }
 // putZeroThreshold writes the zero threshold to the bstream. Typical values
 // take a single byte, all other values take 9 bytes. In detail:
 //
 // * A threshold of 0 is stored as a single zero byte.
 //
 // * A threshold that is a power of 2 between (and including) 2^-243 and 2^10
 //   is stored as a single byte holding its exponent plus 243. The exponent is
 //   the one from the IEEE 754 style decomposition returned by math.Frexp,
 //   where the fraction is 0.5, so it ranges from -242 to 11 (2^-243 is
 //   0.5*2^-242, and 2^10 is 0.5*2^11). The stored byte is therefore between 1
 //   and 254. Small powers of two are the preferred values for the zero
 //   threshold; the default of 2^-128 (0.5*2^-127) is stored as the single
 //   byte 116.
 //
 // * Every other value is stored as the byte 255 followed by the 8 bytes of
 //   the threshold as a float64, i.e. 9 bytes in total.
 func putZeroThreshold(b *bstream, threshold float64) {
 	if threshold == 0 {
 		b.writeByte(0)
 		return
 	}
 	mantissa, exponent := math.Frexp(threshold)
 	// Only exact powers of two within the supported exponent window have a
 	// one-byte representation.
 	if mantissa == 0.5 && exponent >= -242 && exponent <= 11 {
 		b.writeByte(byte(exponent + 243))
 		return
 	}
 	// Escape byte followed by the raw float64 bits.
 	b.writeByte(255)
 	b.writeBits(math.Float64bits(threshold), 64)
 }
 // readZeroThreshold reads the zero threshold written with putZeroThreshold.
 //
 // The first byte selects the representation:
 //
 // * 0 means the threshold is 0.
 //
 // * 255 means the following 64 bits are the threshold as raw float64 bits.
 //
 // * Any other value is the exponent of a power of two plus 243, where the
 //   threshold is 0.5 * 2^exponent.
 //
 // Any error returned by the underlying reader is passed on unchanged, with a
 // threshold of 0.
 func readZeroThreshold(br *bstreamReader) (float64, error) {
 	b, err := br.ReadByte()
 	if err != nil {
 		return 0, err
 	}
 	switch b {
 	case 0:
 		return 0, nil
 	case 255:
 		v, err := br.readBits(64)
 		if err != nil {
 			return 0, err
 		}
 		return math.Float64frombits(v), nil
 	default:
 		// Widen to int before subtracting the bias. Subtracting in byte
 		// arithmetic wraps around for every b < 243 and would turn all
 		// negative exponents (including the default 2^-128) into large
 		// positive ones.
 		return math.Ldexp(0.5, int(b)-243), nil
 	}
 }
 type bucketIterator struct {
 	spans  []histogram.Span
 	span   int // Span position of last yielded bucket.
--- a/tsdb/chunkenc/varbit.go
+++ b/tsdb/chunkenc/varbit.go
@ -14,46 +14,14 @@
 package chunkenc
 import (
-	"math"
+	"math/bits"
 	"github.com/pkg/errors"
 )
 // putVarbitFloat writes a float64 using varbit encoding. The IEEE 754 bit
 // pattern of val is reinterpreted as an int64 and handed to putVarbitInt.
 func putVarbitFloat(b *bstream, val float64) {
 	// TODO(beorn7): The resulting int64 here will almost never be a small
 	// integer. Thus, the varbit encoding doesn't really make sense
 	// here. This function is only used to encode the zero threshold in
 	// histograms. Based on that, here is an idea to improve the encoding:
 	//
 	// It is recommended to use (usually negative) powers of two as
 	// thresholds. The default value for the zero threshold is in fact
 	// 2^-128, or 0.5*2^-127, as it is represented by IEEE 754. It is
 	// therefore worth a try to test if the threshold is a power of 2 and
 	// then just store the exponent. 0 is also a common threshold for those
 	// use cases where only observations of precisely zero should go to the
 	// zero bucket. This results in the following proposal:
 	// - First we store 1 byte.
 	// - Iff that byte is 255 (all bits set), it is followed by a direct
 	//   8byte representation of the float.
 	// - If the byte is 0, the threshold is 0.
 	// - In all other cases, take the number represented by the byte,
 	//   subtract 246, and that's the exponent (i.e. between -245 and
 	//   +8, covering thresholds that are powers of 2 between 2^-246
 	//   to 128).
 	raw := math.Float64bits(val)
 	putVarbitInt(b, int64(raw))
 }
 // readVarbitFloat reads a float64 encoded with putVarbitFloat: it reads an
 // int64 with readVarbitInt and reinterprets its bits as a float64. If reading
 // fails, it returns 0 together with the error.
 func readVarbitFloat(b *bstreamReader) (float64, error) {
 	raw, err := readVarbitInt(b)
 	if err == nil {
 		return math.Float64frombits(uint64(raw)), nil
 	}
 	return 0, err
 }
 // putVarbitInt writes an int64 using varbit encoding with a bit bucketing
-// optimized for the dod's observed in histogram buckets.
+// optimized for the dod's observed in histogram buckets, plus a few additional
 // buckets for large numbers.
 //
 // TODO(Dieterbe): We could improve this further: Each branch doesn't need to
 // support any values of any of the prior branches. So we can expand the range
@ -62,22 +30,31 @@ func readVarbitFloat(b *bstreamReader) (float64, error) {
 // center-piece we skip).
 func putVarbitInt(b *bstream, val int64) {
 	switch {
-	case val == 0:
+	case val == 0: // Precisely 0, needs 1 bit.
 		b.writeBit(zero)
-	case bitRange(val, 3): // -3 <= val <= 4
+	case bitRange(val, 3): // -3 <= val <= 4, needs 5 bits.
 		b.writeBits(0b10, 2)
 		b.writeBits(uint64(val), 3)
-	case bitRange(val, 6): // -31 <= val <= 32
+	case bitRange(val, 6): // -31 <= val <= 32, 9 bits.
 		b.writeBits(0b110, 3)
 		b.writeBits(uint64(val), 6)
-	case bitRange(val, 9): // -255 <= val <= 256
+	case bitRange(val, 9): // -255 <= val <= 256, 13 bits.
 		b.writeBits(0b1110, 4)
 		b.writeBits(uint64(val), 9)
-	case bitRange(val, 12): // -2047 <= val <= 2048
+	case bitRange(val, 12): // -2047 <= val <= 2048, 17 bits.
 		b.writeBits(0b11110, 5)
 		b.writeBits(uint64(val), 12)
 	case bitRange(val, 18): // -131071 <= val <= 131072, 3 bytes.
 		b.writeBits(0b111110, 6)
 		b.writeBits(uint64(val), 18)
 	case bitRange(val, 25): // -16777215 <= val <= 16777216, 4 bytes.
 		b.writeBits(0b1111110, 7)
 		b.writeBits(uint64(val), 25)
 	case bitRange(val, 56): // -36028797018963967 <= val <= 36028797018963968, 8 bytes.
 		b.writeBits(0b11111110, 8)
 		b.writeBits(uint64(val), 56)
 	default:
-		b.writeBits(0b11111, 5)
+		b.writeBits(0b11111111, 8) // Worst case, needs 9 bytes.
 		b.writeBits(uint64(val), 64)
 	}
 }
@ -85,7 +62,7 @@ func putVarbitInt(b *bstream, val int64) {
 // readVarbitInt reads an int64 encoded with putVarbitInt.
 func readVarbitInt(b *bstreamReader) (int64, error) {
 	var d byte
-	for i := 0; i < 5; i++ {
+	for i := 0; i < 8; i++ {
 		d <<= 1
 		bit, err := b.readBitFast()
 		if err != nil {
@ -114,7 +91,13 @@ func readVarbitInt(b *bstreamReader) (int64, error) {
 		sz = 9
 	case 0b11110:
 		sz = 12
-	case 0b11111:
+	case 0b111110:
 		sz = 18
 	case 0b1111110:
 		sz = 25
 	case 0b11111110:
 		sz = 56
 	case 0b11111111:
 		// Do not use fast because it's very unlikely it will succeed.
 		bits, err := b.readBits(64)
 		if err != nil {
@ -122,6 +105,8 @@ func readVarbitInt(b *bstreamReader) (int64, error) {
 		}
 		val = int64(bits)
 	default:
 		return 0, errors.Errorf("invalid bit pattern %b", d)
 	}
 	if sz != 0 {
@ -141,3 +126,104 @@ func readVarbitInt(b *bstreamReader) (int64, error) {
 	return val, nil
 }
 // bitRangeUint reports whether x can be represented with nbits bits, i.e.
 // whether the minimum number of bits needed to represent x does not exceed
 // nbits.
 func bitRangeUint(x uint64, nbits int) bool {
 	return bits.Len64(x) <= nbits
 }
 // putVarbitUint writes a uint64 using varbit encoding. It uses the same bit
 // buckets as putVarbitInt: a marker made of leading one bits identifies the
 // bucket and is followed by the value in that bucket's payload width. Zero is
 // written as a single zero bit without any payload.
 func putVarbitUint(b *bstream, val uint64) {
 	if val == 0 {
 		// Precisely 0, needs 1 bit.
 		b.writeBit(zero)
 		return
 	}

 	// Pick the smallest bucket the value fits into, then emit marker and
 	// payload in one place.
 	var (
 		marker     uint64
 		markerBits int
 		payload    int
 	)
 	switch {
 	case bitRangeUint(val, 3): // val <= 7, needs 5 bits.
 		marker, markerBits, payload = 0b10, 2, 3
 	case bitRangeUint(val, 6): // val <= 63, 9 bits.
 		marker, markerBits, payload = 0b110, 3, 6
 	case bitRangeUint(val, 9): // val <= 511, 13 bits.
 		marker, markerBits, payload = 0b1110, 4, 9
 	case bitRangeUint(val, 12): // val <= 4095, 17 bits.
 		marker, markerBits, payload = 0b11110, 5, 12
 	case bitRangeUint(val, 18): // val <= 262143, 3 bytes.
 		marker, markerBits, payload = 0b111110, 6, 18
 	case bitRangeUint(val, 25): // val <= 33554431, 4 bytes.
 		marker, markerBits, payload = 0b1111110, 7, 25
 	case bitRangeUint(val, 56): // val <= 72057594037927935, 8 bytes.
 		marker, markerBits, payload = 0b11111110, 8, 56
 	default: // Worst case, needs 9 bytes.
 		marker, markerBits, payload = 0b11111111, 8, 64
 	}
 	b.writeBits(marker, markerBits)
 	b.writeBits(val, payload)
 }
 // readVarbitUint reads a uint64 encoded with putVarbitUint. It first reads the
 // bucket marker (up to 8 bits, ending early at the first zero bit) and then
 // the payload whose width is determined by that marker. Read errors are
 // returned unchanged together with a value of 0.
 func readVarbitUint(b *bstreamReader) (uint64, error) {
 	var marker byte
 	for n := 0; n < 8; n++ {
 		marker <<= 1
 		// Try the fast path first and fall back to the regular read.
 		next, err := b.readBitFast()
 		if err != nil {
 			next, err = b.readBit()
 		}
 		if err != nil {
 			return 0, err
 		}
 		if next == zero {
 			break
 		}
 		marker |= 1
 	}

 	var width uint8
 	switch marker {
 	case 0b0:
 		// val == 0, there is no payload.
 		return 0, nil
 	case 0b10:
 		width = 3
 	case 0b110:
 		width = 6
 	case 0b1110:
 		width = 9
 	case 0b11110:
 		width = 12
 	case 0b111110:
 		width = 18
 	case 0b1111110:
 		width = 25
 	case 0b11111110:
 		width = 56
 	case 0b11111111:
 		// Do not use fast because it's very unlikely it will succeed.
 		full, err := b.readBits(64)
 		if err != nil {
 			return 0, err
 		}
 		return full, nil
 	default:
 		return 0, errors.Errorf("invalid bit pattern %b", marker)
 	}

 	payload, err := b.readBitsFast(width)
 	if err != nil {
 		payload, err = b.readBits(width)
 	}
 	if err != nil {
 		return 0, err
 	}
 	return payload, nil
 }
--- a/tsdb/chunkenc/varbit_test.go
+++ b/tsdb/chunkenc/varbit_test.go
@ -0,0 +1,85 @@
 // Copyright 2021 The Prometheus Authors
 // Licensed under the Apache License, Version 2.0 (the "License");
 // you may not use this file except in compliance with the License.
 // You may obtain a copy of the License at
 //
 // http://www.apache.org/licenses/LICENSE-2.0
 //
 // Unless required by applicable law or agreed to in writing, software
 // distributed under the License is distributed on an "AS IS" BASIS,
 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 // See the License for the specific language governing permissions and
 // limitations under the License.
 package chunkenc
 import (
 	"math"
 	"testing"
 	"github.com/stretchr/testify/require"
 )
 // TestVarbitInt writes a series of signed integers around the bucket
 // boundaries of the varbit encoding into one stream and checks that reading
 // the stream back yields the same values in the same order.
 func TestVarbitInt(t *testing.T) {
 	inputs := []int64{
 		math.MinInt64,
 		-36028797018963968, -36028797018963967,
 		-16777216, -16777215,
 		-131072, -131071,
 		-2048, -2047,
 		-256, -255,
 		-32, -31,
 		-4, -3,
 		-1, 0, 1,
 		4, 5,
 		32, 33,
 		256, 257,
 		2048, 2049,
 		131072, 131073,
 		16777216, 16777217,
 		36028797018963968, 36028797018963969,
 		math.MaxInt64,
 	}

 	var stream bstream
 	for i := range inputs {
 		putVarbitInt(&stream, inputs[i])
 	}

 	reader := newBReader(stream.bytes())
 	for _, expected := range inputs {
 		actual, err := readVarbitInt(&reader)
 		require.NoError(t, err)
 		require.Equal(t, expected, actual)
 	}
 }
 // TestVarbitUint writes a series of unsigned integers around the bucket
 // boundaries of the varbit encoding into one stream and checks that reading
 // the stream back yields the same values in the same order.
 func TestVarbitUint(t *testing.T) {
 	inputs := []uint64{
 		0, 1,
 		7, 8,
 		63, 64,
 		511, 512,
 		4095, 4096,
 		262143, 262144,
 		33554431, 33554432,
 		72057594037927935, 72057594037927936,
 		math.MaxUint64,
 	}

 	var stream bstream
 	for i := range inputs {
 		putVarbitUint(&stream, inputs[i])
 	}

 	reader := newBReader(stream.bytes())
 	for _, expected := range inputs {
 		actual, err := readVarbitUint(&reader)
 		require.NoError(t, err)
 		require.Equal(t, expected, actual)
 	}
 }
--- a/tsdb/chunkenc/xor.go
+++ b/tsdb/chunkenc/xor.go
@ -111,7 +111,7 @@ func (c *XORChunk) Appender() (Appender, error) {
 		leading:  it.leading,
 		trailing: it.trailing,
 	}
-	if binary.BigEndian.Uint16(a.b.bytes()) == 0 {
+	if it.numTotal == 0 {
 		a.leading = 0xff
 	}
 	return a, nil
--- a/tsdb/docs/format/chunks.md
+++ b/tsdb/docs/format/chunks.md
@ -34,22 +34,62 @@ in-file offset (lower 4 bytes) and segment sequence number (upper 4 bytes).
 └───────────────┴───────────────────┴──────────────┴────────────────┘
 ```
-## XOR chunk
+Notes:
 * `<uvarint>` has 1 to 10 bytes.
 * `encoding`: Currently either `XOR` or `histogram`.
 * `data`: See below for each encoding.
-TODO(beorn7): Add.
+## XOR chunk data
 ## Histogram chunk
 TODO(beorn7): This is out of date. Update once settled on the (more or less) final format.
 ```
-┌──────────────┬─────────────────┬──────────────────────────┬──────────────────────────┬──────────────┐
+┌──────────────────────┬───────────────┬───────────────┬──────────────────────┬──────────────────────┬──────────────────────┬──────────────────────┬─────┐
-│ len <uint16> │ schema <varint> │ pos-spans <span-section> │ neg-spans <span-section> │ data <bytes> │
+│ num_samples <uint16> │ ts_0 <varint> │ v_0 <float64> │ ts_1_delta <uvarint> │ v_1_xor <varbit_xor> │ ts_n_dod <varbit_ts> │ v_n_xor <varbit_xor> │ ... │
-└──────────────┴─────────────────┴──────────────────────────┴──────────────────────────┴──────────────┘
+└──────────────────────┴───────────────┴───────────────┴──────────────────────┴──────────────────────┴──────────────────────┴──────────────────────┴─────┘
 span-section:
 ┌──────────────┬──────────────────┬──────────────────┬────────────┐
 │ len <varint> │ length1 <varint> │ offset1 <varint> │ length2... │
 └──────────────┴──────────────────┴──────────────────┴────────────┘
 ```
 ### Notes:
 * `ts` is the timestamp, `v` is the value.
 * `...` means to repeat the previous two fields as needed, with `n` starting at 2 and going up to `num_samples` – 1.
 * `<uint16>` has 2 bytes in big-endian order.
 * `<varint>` and `<uvarint>` have 1 to 10 bytes each.
 * `ts_1_delta` is `ts_1` – `ts_0`.
 * `ts_n_dod` is the “delta of deltas” of timestamps, i.e. (`ts_n` – `ts_n-1`) – (`ts_n-1` – `ts_n-2`).
 * `<v_n_xor>` is the result of `v_n` XOR `v_n-1`.
 * `<varbit_xor>` is a specific variable bitwidth encoding of the result of XORing the current and the previous value. It has between 1 bit and 77 bits.
  See [code for details](https://github.com/prometheus/prometheus/blob/7309c20e7e5774e7838f183ec97c65baa4362edc/tsdb/chunkenc/xor.go#L220-L253).
 * `<varbit_ts>` is a specific variable bitwidth encoding for the “delta of deltas” of timestamps (signed integers that are ideally small).
  It has between 1 and 68 bits.
 See [code for details](https://github.com/prometheus/prometheus/blob/7309c20e7e5774e7838f183ec97c65baa4362edc/tsdb/chunkenc/xor.go#L179-L205).
 ## Histogram chunk data
 ```
 ┌──────────────────────┬───────────────────────────────┬─────────────────────┬──────────────────┬──────────────────┬────────────────┐
 │ num_samples <uint16> │ zero_threshold <1 or 9 bytes> │ schema <varbit_int> │ pos_spans <data> │ neg_spans <data> │ samples <data> │
 └──────────────────────┴───────────────────────────────┴─────────────────────┴──────────────────┴──────────────────┴────────────────┘
 ```
 ### Positive and negative spans data:
 ```
 ┌───────────────────┬────────────────────────┬───────────────────────┬─────┬──────────────────────────┬─────────────────────────┐
 │ num <varbit_uint> │ length_1 <varbit_uint> │ offset_1 <varbit_int> │ ... │ length_num <varbit_uint> │ offset_num <varbit_int> │
 └───────────────────┴────────────────────────┴───────────────────────┴─────┴──────────────────────────┴─────────────────────────┘
 ```
 ### Samples data:
 ```
 TODO
 ```
 ### Notes:
 * `zero_threshold` has a specific encoding:
  * If 0, it is a single zero byte.
  * If a power of two between 2^-243 and 2^10, it is a single byte between 1 and 254.
  * Otherwise, it is a byte with all bits set (255), followed by a float64, resulting in 9 bytes length.
 * `schema` is a specific value defined by the exposition format. Currently valid values are -4 <= n <= 8.
 * `<varbit_int>` is a variable bitwidth encoding for signed integers, optimized for “delta of deltas” of bucket deltas. It has between 1 bit and 9 bytes.
 * `<varbit_uint>` is a variable bitwidth encoding for unsigned integers with the same bit-bucketing as `<varbit_int>`.