// Copyright 2024 The Prometheus Authors // Licensed under the Apache License, Version 2.0 (the "License"); // you may not use this file except in compliance with the License. // You may obtain a copy of the License at // // http://www.apache.org/licenses/LICENSE-2.0 // // Unless required by applicable law or agreed to in writing, software // distributed under the License is distributed on an "AS IS" BASIS, // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. // See the License for the specific language governing permissions and // limitations under the License. package textparse import ( "errors" "io" "math" "strconv" "strings" "github.com/prometheus/common/model" "github.com/prometheus/prometheus/model/exemplar" "github.com/prometheus/prometheus/model/histogram" "github.com/prometheus/prometheus/model/labels" "github.com/prometheus/prometheus/util/convertnhcb" ) type collectionState int const ( stateStart collectionState = iota stateCollecting stateEmitting ) // The NHCBParser wraps a Parser and converts classic histograms to native // histograms with custom buckets. // // Since Parser interface is line based, this parser needs to keep track // of the last classic histogram series it saw to collate them into a // single native histogram. // // Note: // - Only series that have the histogram metadata type are considered for // conversion. // - The classic series are also returned if keepClassicHistograms is true. type NHCBParser struct { // The parser we're wrapping. parser Parser // Option to keep classic histograms along with converted histograms. keepClassicHistograms bool // Labels builder. builder labels.ScratchBuilder // State of the parser. state collectionState // Caches the values from the underlying parser. // For Series and Histogram. bytes []byte ts *int64 value float64 h *histogram.Histogram fh *histogram.FloatHistogram // For Metric. lset labels.Labels metricString string // For Type. bName []byte typ model.MetricType // Caches the entry itself if we are inserting a converted NHCB // halfway through. entry Entry err error // Caches the values and metric for the inserted converted NHCB. bytesNHCB []byte hNHCB *histogram.Histogram fhNHCB *histogram.FloatHistogram lsetNHCB labels.Labels exemplars []exemplar.Exemplar ctNHCB *int64 metricStringNHCB string // Collates values from the classic histogram series to build // the converted histogram later. tempLsetNHCB labels.Labels tempNHCB convertnhcb.TempHistogram tempExemplars []exemplar.Exemplar tempExemplarCount int tempCT *int64 // Remembers the last base histogram metric name (assuming it's // a classic histogram) so we can tell if the next float series // is part of the same classic histogram. lastHistogramName string lastHistogramLabelsHash uint64 lastHistogramExponential bool // Reused buffer for hashing labels. hBuffer []byte } func NewNHCBParser(p Parser, st *labels.SymbolTable, keepClassicHistograms bool) Parser { return &NHCBParser{ parser: p, keepClassicHistograms: keepClassicHistograms, builder: labels.NewScratchBuilderWithSymbolTable(st, 16), tempNHCB: convertnhcb.NewTempHistogram(), } } func (p *NHCBParser) Series() ([]byte, *int64, float64) { return p.bytes, p.ts, p.value } func (p *NHCBParser) Histogram() ([]byte, *int64, *histogram.Histogram, *histogram.FloatHistogram) { if p.state == stateEmitting { return p.bytesNHCB, p.ts, p.hNHCB, p.fhNHCB } return p.bytes, p.ts, p.h, p.fh } func (p *NHCBParser) Help() ([]byte, []byte) { return p.parser.Help() } func (p *NHCBParser) Type() ([]byte, model.MetricType) { return p.bName, p.typ } func (p *NHCBParser) Unit() ([]byte, []byte) { return p.parser.Unit() } func (p *NHCBParser) Comment() []byte { return p.parser.Comment() } func (p *NHCBParser) Metric(l *labels.Labels) string { if p.state == stateEmitting { *l = p.lsetNHCB return p.metricStringNHCB } *l = p.lset return p.metricString } func (p *NHCBParser) Exemplar(ex *exemplar.Exemplar) bool { if p.state == stateEmitting { if len(p.exemplars) == 0 { return false } *ex = p.exemplars[0] p.exemplars = p.exemplars[1:] return true } return p.parser.Exemplar(ex) } func (p *NHCBParser) CreatedTimestamp() *int64 { switch p.state { case stateStart: if p.entry == EntrySeries || p.entry == EntryHistogram { return p.parser.CreatedTimestamp() } case stateCollecting: return p.tempCT case stateEmitting: return p.ctNHCB } return nil } func (p *NHCBParser) Next() (Entry, error) { if p.state == stateEmitting { p.state = stateStart if p.entry == EntrySeries { isNHCB := p.handleClassicHistogramSeries(p.lset) if isNHCB && !p.keepClassicHistograms { // Do not return the classic histogram series if it was converted to NHCB and we are not keeping classic histograms. return p.Next() } } return p.entry, p.err } p.entry, p.err = p.parser.Next() if p.err != nil { if errors.Is(p.err, io.EOF) && p.processNHCB() { return EntryHistogram, nil } return EntryInvalid, p.err } switch p.entry { case EntrySeries: p.bytes, p.ts, p.value = p.parser.Series() p.metricString = p.parser.Metric(&p.lset) // Check the label set to see if we can continue or need to emit the NHCB. var isNHCB bool if p.compareLabels() { // Labels differ. Check if we can emit the NHCB. if p.processNHCB() { return EntryHistogram, nil } isNHCB = p.handleClassicHistogramSeries(p.lset) } else { // Labels are the same. Check if after an exponential histogram. if p.lastHistogramExponential { isNHCB = false } else { isNHCB = p.handleClassicHistogramSeries(p.lset) } } if isNHCB && !p.keepClassicHistograms { // Do not return the classic histogram series if it was converted to NHCB and we are not keeping classic histograms. return p.Next() } return p.entry, p.err case EntryHistogram: p.bytes, p.ts, p.h, p.fh = p.parser.Histogram() p.metricString = p.parser.Metric(&p.lset) p.storeExponentialLabels() case EntryType: p.bName, p.typ = p.parser.Type() } if p.processNHCB() { return EntryHistogram, nil } return p.entry, p.err } // Return true if labels have changed and we should emit the NHCB. func (p *NHCBParser) compareLabels() bool { if p.state != stateCollecting { return false } if p.typ != model.MetricTypeHistogram { // Different metric type. return true } if p.lastHistogramName != convertnhcb.GetHistogramMetricBaseName(p.lset.Get(labels.MetricName)) { // Different metric name. return true } nextHash, _ := p.lset.HashWithoutLabels(p.hBuffer, labels.BucketLabel) // Different label values. return p.lastHistogramLabelsHash != nextHash } // Save the label set of the classic histogram without suffix and bucket `le` label. func (p *NHCBParser) storeClassicLabels() { p.lastHistogramName = convertnhcb.GetHistogramMetricBaseName(p.lset.Get(labels.MetricName)) p.lastHistogramLabelsHash, _ = p.lset.HashWithoutLabels(p.hBuffer, labels.BucketLabel) p.lastHistogramExponential = false } func (p *NHCBParser) storeExponentialLabels() { p.lastHistogramName = p.lset.Get(labels.MetricName) p.lastHistogramLabelsHash, _ = p.lset.HashWithoutLabels(p.hBuffer) p.lastHistogramExponential = true } // handleClassicHistogramSeries collates the classic histogram series to be converted to NHCB // if it is actually a classic histogram series (and not a normal float series) and if there // isn't already a native histogram with the same name (assuming it is always processed // right before the classic histograms) and returns true if the collation was done. func (p *NHCBParser) handleClassicHistogramSeries(lset labels.Labels) bool { if p.typ != model.MetricTypeHistogram { return false } mName := lset.Get(labels.MetricName) // Sanity check to ensure that the TYPE metadata entry name is the same as the base name. if convertnhcb.GetHistogramMetricBaseName(mName) != string(p.bName) { return false } switch { case strings.HasSuffix(mName, "_bucket") && lset.Has(labels.BucketLabel): le, err := strconv.ParseFloat(lset.Get(labels.BucketLabel), 64) if err == nil && !math.IsNaN(le) { p.processClassicHistogramSeries(lset, "_bucket", func(hist *convertnhcb.TempHistogram) { hist.BucketCounts[le] = p.value }) return true } case strings.HasSuffix(mName, "_count"): p.processClassicHistogramSeries(lset, "_count", func(hist *convertnhcb.TempHistogram) { hist.Count = p.value }) return true case strings.HasSuffix(mName, "_sum"): p.processClassicHistogramSeries(lset, "_sum", func(hist *convertnhcb.TempHistogram) { hist.Sum = p.value }) return true } return false } func (p *NHCBParser) processClassicHistogramSeries(lset labels.Labels, suffix string, updateHist func(*convertnhcb.TempHistogram)) { if p.state != stateCollecting { p.storeClassicLabels() p.tempCT = p.parser.CreatedTimestamp() p.state = stateCollecting } p.tempLsetNHCB = convertnhcb.GetHistogramMetricBase(lset, suffix) p.storeExemplars() updateHist(&p.tempNHCB) } func (p *NHCBParser) storeExemplars() { for ex := p.nextExemplarPtr(); p.parser.Exemplar(ex); ex = p.nextExemplarPtr() { p.tempExemplarCount++ } } func (p *NHCBParser) nextExemplarPtr() *exemplar.Exemplar { switch { case p.tempExemplarCount == len(p.tempExemplars)-1: // Reuse the previously allocated exemplar, it was not filled up. case len(p.tempExemplars) == cap(p.tempExemplars): // Let the runtime grow the slice. p.tempExemplars = append(p.tempExemplars, exemplar.Exemplar{}) default: // Take the next element into use. p.tempExemplars = p.tempExemplars[:len(p.tempExemplars)+1] } return &p.tempExemplars[len(p.tempExemplars)-1] } func (p *NHCBParser) swapExemplars() { p.exemplars = p.tempExemplars[:p.tempExemplarCount] p.tempExemplars = p.tempExemplars[:0] p.tempExemplarCount = 0 } // processNHCB converts the collated classic histogram series to NHCB and caches the info // to be returned to callers. Retruns true if the conversion was successful. func (p *NHCBParser) processNHCB() bool { if p.state != stateCollecting { return false } ub := make([]float64, 0, len(p.tempNHCB.BucketCounts)) for b := range p.tempNHCB.BucketCounts { ub = append(ub, b) } upperBounds, hBase := convertnhcb.ProcessUpperBoundsAndCreateBaseHistogram(ub, false) fhBase := hBase.ToFloat(nil) h, fh := convertnhcb.NewHistogram(p.tempNHCB, upperBounds, hBase, fhBase) if h != nil { if err := h.Validate(); err != nil { return false } p.hNHCB = h p.fhNHCB = nil } else if fh != nil { if err := fh.Validate(); err != nil { return false } p.hNHCB = nil p.fhNHCB = fh } p.metricStringNHCB = p.tempLsetNHCB.Get(labels.MetricName) + strings.ReplaceAll(p.tempLsetNHCB.DropMetricName().String(), ", ", ",") p.bytesNHCB = []byte(p.metricStringNHCB) p.lsetNHCB = p.tempLsetNHCB p.swapExemplars() p.ctNHCB = p.tempCT p.tempNHCB = convertnhcb.NewTempHistogram() p.state = stateEmitting p.tempCT = nil return true }