2021-06-30 03:45:43 -07:00
// Copyright 2021 The Prometheus Authors
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
package chunkenc
2021-08-06 05:38:41 -07:00
import (
"github.com/prometheus/prometheus/pkg/histogram"
)
2021-06-30 03:45:43 -07:00
2021-10-04 06:14:12 -07:00
const (
2021-10-06 03:32:19 -07:00
counterResetMask = 0b10000000
notCounterResetMask = 0b01000000
2021-10-04 06:14:12 -07:00
)
2021-10-06 03:32:19 -07:00
func writeHistoChunkMeta ( b * bstream , schema int32 , zeroThreshold float64 , posSpans , negSpans [ ] histogram . Span ) {
2021-06-30 03:45:43 -07:00
putInt64VBBucket ( b , int64 ( schema ) )
2021-08-06 05:38:41 -07:00
putFloat64VBBucket ( b , zeroThreshold )
2021-06-30 03:45:43 -07:00
putHistoChunkMetaSpans ( b , posSpans )
putHistoChunkMetaSpans ( b , negSpans )
}
func putHistoChunkMetaSpans ( b * bstream , spans [ ] histogram . Span ) {
putInt64VBBucket ( b , int64 ( len ( spans ) ) )
for _ , s := range spans {
putInt64VBBucket ( b , int64 ( s . Length ) )
putInt64VBBucket ( b , int64 ( s . Offset ) )
}
}
2021-10-06 03:32:19 -07:00
func readHistoChunkMeta ( b * bstreamReader ) ( schema int32 , zeroThreshold float64 , posSpans [ ] histogram . Span , negSpans [ ] histogram . Span , err error ) {
_ , err = b . ReadByte ( ) // The header.
2021-10-04 06:14:12 -07:00
if err != nil {
2021-10-06 02:58:10 -07:00
return
2021-10-04 06:14:12 -07:00
}
2021-06-30 03:45:43 -07:00
v , err := readInt64VBBucket ( b )
if err != nil {
2021-10-06 02:58:10 -07:00
return
2021-06-30 03:45:43 -07:00
}
2021-10-06 02:58:10 -07:00
schema = int32 ( v )
2021-06-30 03:45:43 -07:00
2021-10-06 02:58:10 -07:00
zeroThreshold , err = readFloat64VBBucket ( b )
2021-08-06 05:38:41 -07:00
if err != nil {
2021-10-06 02:58:10 -07:00
return
2021-08-06 05:38:41 -07:00
}
2021-10-06 02:58:10 -07:00
posSpans , err = readHistoChunkMetaSpans ( b )
2021-06-30 03:45:43 -07:00
if err != nil {
2021-10-06 02:58:10 -07:00
return
2021-06-30 03:45:43 -07:00
}
2021-10-06 02:58:10 -07:00
negSpans , err = readHistoChunkMetaSpans ( b )
2021-06-30 03:45:43 -07:00
if err != nil {
2021-10-06 02:58:10 -07:00
return
2021-06-30 03:45:43 -07:00
}
2021-10-06 02:58:10 -07:00
return
2021-06-30 03:45:43 -07:00
}
func readHistoChunkMetaSpans ( b * bstreamReader ) ( [ ] histogram . Span , error ) {
var spans [ ] histogram . Span
num , err := readInt64VBBucket ( b )
if err != nil {
return nil , err
}
for i := 0 ; i < int ( num ) ; i ++ {
length , err := readInt64VBBucket ( b )
if err != nil {
return nil , err
}
offset , err := readInt64VBBucket ( b )
if err != nil {
return nil , err
}
spans = append ( spans , histogram . Span {
Length : uint32 ( length ) ,
Offset : int32 ( offset ) ,
} )
}
return spans , nil
}
2021-07-01 23:20:30 -07:00
type bucketIterator struct {
spans [ ] histogram . Span
span int // span position of last yielded bucket
bucket int // bucket position within span of last yielded bucket
idx int // bucket index (globally across all spans) of last yielded bucket
}
func newBucketIterator ( spans [ ] histogram . Span ) * bucketIterator {
b := bucketIterator {
spans : spans ,
span : 0 ,
bucket : - 1 ,
idx : - 1 ,
}
if len ( spans ) > 0 {
b . idx += int ( spans [ 0 ] . Offset )
}
return & b
}
func ( b * bucketIterator ) Next ( ) ( int , bool ) {
// we're already out of bounds
if b . span >= len ( b . spans ) {
return 0 , false
}
try :
if b . bucket < int ( b . spans [ b . span ] . Length - 1 ) { // try to move within same span.
b . bucket ++
b . idx ++
return b . idx , true
} else if b . span < len ( b . spans ) - 1 { // try to move from one span to the next
b . span ++
b . idx += int ( b . spans [ b . span ] . Offset + 1 )
b . bucket = 0
if b . spans [ b . span ] . Length == 0 {
// pathological case that should never happen. We can't use this span, let's try again.
goto try
}
return b . idx , true
}
// we're out of options
return 0 , false
}
2021-07-05 06:27:46 -07:00
// Interjection describes that num new buckets are introduced before processing the pos'th delta from the original slice
type Interjection struct {
2021-07-01 23:20:30 -07:00
pos int
num int
}
// compareSpans returns the interjections to convert a slice of deltas to a new slice representing an expanded set of buckets, or false if incompatible (e.g. if buckets were removed)
// For example:
// Let's say the old buckets look like this:
// span syntax: [offset, length]
// spans : [ 0 , 2 ] [2,1] [ 3 , 2 ] [3,1] [1,1]
// bucket idx : [0] [1] 2 3 [4] 5 6 7 [8] [9] 10 11 12 [13] 14 [15]
// raw values 6 3 3 2 4 5 1
// deltas 6 -3 0 -1 2 1 -4
// But now we introduce a new bucket layout. (carefully chosen example where we have a span appended, one unchanged[*], one prepended, and two merge - in that order)
// [*] unchanged in terms of which bucket indices they represent. but to achieve that, their offset needs to change if "disrupted" by spans changing ahead of them
// \/ this one is "unchanged"
// spans : [ 0 , 3 ] [1,1] [ 1 , 4 ] [ 3 , 3 ]
// bucket idx : [0] [1] [2] 3 [4] 5 [6] [7] [8] [9] 10 11 12 [13] [14] [15]
// raw values 6 3 0 3 0 0 2 4 5 0 1
// deltas 6 -3 -3 3 -3 0 2 2 1 -5 1
// delta mods: / \ / \ / \
// note that whenever any new buckets are introduced, the subsequent "old" bucket needs to readjust its delta to the new base of 0
// thus, for the caller, who wants to transform the set of original deltas to a new set of deltas to match a new span layout that adds buckets, we simply
// need to generate a list of interjections
// note: within compareSpans we don't have to worry about the changes to the spans themselves,
// thanks to the iterators, we get to work with the more useful bucket indices (which of course directly correspond to the buckets we have to adjust)
2021-07-05 06:27:46 -07:00
func compareSpans ( a , b [ ] histogram . Span ) ( [ ] Interjection , bool ) {
2021-07-01 23:20:30 -07:00
ai := newBucketIterator ( a )
bi := newBucketIterator ( b )
2021-07-05 06:27:46 -07:00
var interjections [ ] Interjection
2021-07-01 23:20:30 -07:00
// when inter.num becomes > 0, this becomes a valid interjection that should be yielded when we finish a streak of new buckets
2021-07-05 06:27:46 -07:00
var inter Interjection
2021-07-01 23:20:30 -07:00
av , aok := ai . Next ( )
bv , bok := bi . Next ( )
2021-07-05 14:59:33 -07:00
loop :
2021-07-01 23:20:30 -07:00
for {
2021-07-05 14:59:33 -07:00
switch {
case aok && bok :
switch {
case av == bv : // Both have an identical value. move on!
// Finish WIP interjection and reset.
2021-07-01 23:20:30 -07:00
if inter . num > 0 {
interjections = append ( interjections , inter )
}
inter . num = 0
av , aok = ai . Next ( )
bv , bok = bi . Next ( )
2021-07-05 14:59:33 -07:00
inter . pos ++
case av < bv : // b misses a value that is in a.
2021-07-01 23:20:30 -07:00
return interjections , false
2021-07-05 14:59:33 -07:00
case av > bv : // a misses a value that is in b. Forward b and recompare.
2021-07-01 23:20:30 -07:00
inter . num ++
bv , bok = bi . Next ( )
}
2021-07-05 14:59:33 -07:00
case aok && ! bok : // b misses a value that is in a.
2021-07-01 23:20:30 -07:00
return interjections , false
2021-07-05 14:59:33 -07:00
case ! aok && bok : // a misses a value that is in b. Forward b and recompare.
2021-07-01 23:20:30 -07:00
inter . num ++
bv , bok = bi . Next ( )
2021-07-05 14:59:33 -07:00
default : // Both iterators ran out. We're done.
2021-07-01 23:20:30 -07:00
if inter . num > 0 {
interjections = append ( interjections , inter )
}
2021-07-05 14:59:33 -07:00
break loop
2021-07-01 23:20:30 -07:00
}
}
return interjections , true
}
2021-07-05 14:01:39 -07:00
// interject merges 'in' with the provided interjections and writes them into
// 'out', which must already have the appropriate length.
2021-07-05 06:27:46 -07:00
func interject ( in , out [ ] int64 , interjections [ ] Interjection ) [ ] int64 {
2021-07-05 14:01:39 -07:00
var j int // Position in out.
var v int64 // The last value seen.
var interj int // The next interjection to process.
2021-07-01 23:20:30 -07:00
for i , d := range in {
if interj < len ( interjections ) && i == interjections [ interj ] . pos {
2021-07-05 14:01:39 -07:00
// We have an interjection!
// Add interjection.num new delta values such that their
// bucket values equate 0.
2021-07-01 23:20:30 -07:00
out [ j ] = int64 ( - v )
j ++
for x := 1 ; x < interjections [ interj ] . num ; x ++ {
out [ j ] = 0
j ++
}
interj ++
2021-07-05 14:01:39 -07:00
// Now save the value from the input. The delta value we
// should save is the original delta value + the last
// value of the point before the interjection (to undo
// the delta that was introduced by the interjection).
2021-07-01 23:20:30 -07:00
out [ j ] = d + v
j ++
v = d + v
continue
}
2021-07-05 14:01:39 -07:00
// If there was no interjection, the original delta is still
// valid.
2021-07-01 23:20:30 -07:00
out [ j ] = d
j ++
v += d
}
2021-07-05 14:01:39 -07:00
switch interj {
case len ( interjections ) :
// All interjections processed. Nothing more to do.
case len ( interjections ) - 1 :
// One more interjection to process at the end.
out [ j ] = int64 ( - v )
j ++
for x := 1 ; x < interjections [ interj ] . num ; x ++ {
out [ j ] = 0
j ++
}
default :
panic ( "unprocessed interjections left" )
}
2021-07-01 23:20:30 -07:00
return out
}