// Copyright 2021 The Prometheus Authors // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. package chunkenc import ( "github.com/prometheus/prometheus/pkg/histogram" ) func writeHistoChunkMeta(b *bstream, schema int32, zeroThreshold float64, posSpans, negSpans []histogram.Span) { putInt64VBBucket(b, int64(schema)) putFloat64VBBucket(b, zeroThreshold) putHistoChunkMetaSpans(b, posSpans) putHistoChunkMetaSpans(b, negSpans) } func putHistoChunkMetaSpans(b *bstream, spans []histogram.Span) { putInt64VBBucket(b, int64(len(spans))) for _, s := range spans { putInt64VBBucket(b, int64(s.Length)) putInt64VBBucket(b, int64(s.Offset)) } } func readHistoChunkMeta(b *bstreamReader) (int32, float64, []histogram.Span, []histogram.Span, error) { v, err := readInt64VBBucket(b) if err != nil { return 0, 0, nil, nil, err } schema := int32(v) zeroThreshold, err := readFloat64VBBucket(b) if err != nil { return 0, 0, nil, nil, err } posSpans, err := readHistoChunkMetaSpans(b) if err != nil { return 0, 0, nil, nil, err } negSpans, err := readHistoChunkMetaSpans(b) if err != nil { return 0, 0, nil, nil, err } return schema, zeroThreshold, posSpans, negSpans, nil } func readHistoChunkMetaSpans(b *bstreamReader) ([]histogram.Span, error) { var spans []histogram.Span num, err := readInt64VBBucket(b) if err != nil { return nil, err } for i := 0; i < int(num); i++ { length, err := readInt64VBBucket(b) if err != nil { return nil, err } offset, err := readInt64VBBucket(b) if err != nil { return nil, err } spans = append(spans, histogram.Span{ Length: uint32(length), Offset: int32(offset), }) } return spans, nil } type bucketIterator struct { spans []histogram.Span span int // span position of last yielded bucket bucket int // bucket position within span of last yielded bucket idx int // bucket index (globally across all spans) of last yielded bucket } func newBucketIterator(spans []histogram.Span) *bucketIterator { b := bucketIterator{ spans: spans, span: 0, bucket: -1, idx: -1, } if len(spans) > 0 { b.idx += int(spans[0].Offset) } return &b } func (b *bucketIterator) Next() (int, bool) { // we're already out of bounds if b.span >= len(b.spans) { return 0, false } try: if b.bucket < int(b.spans[b.span].Length-1) { // try to move within same span. b.bucket++ b.idx++ return b.idx, true } else if b.span < len(b.spans)-1 { // try to move from one span to the next b.span++ b.idx += int(b.spans[b.span].Offset + 1) b.bucket = 0 if b.spans[b.span].Length == 0 { // pathological case that should never happen. We can't use this span, let's try again. goto try } return b.idx, true } // we're out of options return 0, false } // Interjection describes that num new buckets are introduced before processing the pos'th delta from the original slice type Interjection struct { pos int num int } // compareSpans returns the interjections to convert a slice of deltas to a new slice representing an expanded set of buckets, or false if incompatible (e.g. if buckets were removed) // For example: // Let's say the old buckets look like this: // span syntax: [offset, length] // spans : [ 0 , 2 ] [2,1] [ 3 , 2 ] [3,1] [1,1] // bucket idx : [0] [1] 2 3 [4] 5 6 7 [8] [9] 10 11 12 [13] 14 [15] // raw values 6 3 3 2 4 5 1 // deltas 6 -3 0 -1 2 1 -4 // But now we introduce a new bucket layout. (carefully chosen example where we have a span appended, one unchanged[*], one prepended, and two merge - in that order) // [*] unchanged in terms of which bucket indices they represent. but to achieve that, their offset needs to change if "disrupted" by spans changing ahead of them // \/ this one is "unchanged" // spans : [ 0 , 3 ] [1,1] [ 1 , 4 ] [ 3 , 3 ] // bucket idx : [0] [1] [2] 3 [4] 5 [6] [7] [8] [9] 10 11 12 [13] [14] [15] // raw values 6 3 0 3 0 0 2 4 5 0 1 // deltas 6 -3 -3 3 -3 0 2 2 1 -5 1 // delta mods: / \ / \ / \ // note that whenever any new buckets are introduced, the subsequent "old" bucket needs to readjust its delta to the new base of 0 // thus, for the caller, who wants to transform the set of original deltas to a new set of deltas to match a new span layout that adds buckets, we simply // need to generate a list of interjections // note: within compareSpans we don't have to worry about the changes to the spans themselves, // thanks to the iterators, we get to work with the more useful bucket indices (which of course directly correspond to the buckets we have to adjust) func compareSpans(a, b []histogram.Span) ([]Interjection, bool) { ai := newBucketIterator(a) bi := newBucketIterator(b) var interjections []Interjection // when inter.num becomes > 0, this becomes a valid interjection that should be yielded when we finish a streak of new buckets var inter Interjection av, aok := ai.Next() bv, bok := bi.Next() loop: for { switch { case aok && bok: switch { case av == bv: // Both have an identical value. move on! // Finish WIP interjection and reset. if inter.num > 0 { interjections = append(interjections, inter) } inter.num = 0 av, aok = ai.Next() bv, bok = bi.Next() inter.pos++ case av < bv: // b misses a value that is in a. return interjections, false case av > bv: // a misses a value that is in b. Forward b and recompare. inter.num++ bv, bok = bi.Next() } case aok && !bok: // b misses a value that is in a. return interjections, false case !aok && bok: // a misses a value that is in b. Forward b and recompare. inter.num++ bv, bok = bi.Next() default: // Both iterators ran out. We're done. if inter.num > 0 { interjections = append(interjections, inter) } break loop } } return interjections, true } // interject merges 'in' with the provided interjections and writes them into // 'out', which must already have the appropriate length. func interject(in, out []int64, interjections []Interjection) []int64 { var j int // Position in out. var v int64 // The last value seen. var interj int // The next interjection to process. for i, d := range in { if interj < len(interjections) && i == interjections[interj].pos { // We have an interjection! // Add interjection.num new delta values such that their // bucket values equate 0. out[j] = int64(-v) j++ for x := 1; x < interjections[interj].num; x++ { out[j] = 0 j++ } interj++ // Now save the value from the input. The delta value we // should save is the original delta value + the last // value of the point before the interjection (to undo // the delta that was introduced by the interjection). out[j] = d + v j++ v = d + v continue } // If there was no interjection, the original delta is still // valid. out[j] = d j++ v += d } switch interj { case len(interjections): // All interjections processed. Nothing more to do. case len(interjections) - 1: // One more interjection to process at the end. out[j] = int64(-v) j++ for x := 1; x < interjections[interj].num; x++ { out[j] = 0 j++ } default: panic("unprocessed interjections left") } return out }