2021-06-29 14:45:23 -07:00
|
|
|
// Copyright 2021 The Prometheus Authors
|
|
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
// you may not use this file except in compliance with the License.
|
|
|
|
// You may obtain a copy of the License at
|
|
|
|
//
|
|
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
//
|
|
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
// See the License for the specific language governing permissions and
|
|
|
|
// limitations under the License.
|
|
|
|
|
|
|
|
package textparse
|
|
|
|
|
|
|
|
import (
|
|
|
|
"bytes"
|
2023-11-02 13:45:07 -07:00
|
|
|
"errors"
|
2021-07-13 11:01:44 -07:00
|
|
|
"fmt"
|
2021-06-29 14:45:23 -07:00
|
|
|
"io"
|
2021-07-13 11:01:44 -07:00
|
|
|
"math"
|
2024-10-15 08:28:56 -07:00
|
|
|
"strconv"
|
2021-07-13 11:01:44 -07:00
|
|
|
"strings"
|
2024-10-15 08:28:56 -07:00
|
|
|
"sync"
|
2021-06-29 14:45:23 -07:00
|
|
|
"unicode/utf8"
|
|
|
|
|
2023-10-18 11:04:02 -07:00
|
|
|
"github.com/gogo/protobuf/types"
|
2021-06-29 14:45:23 -07:00
|
|
|
"github.com/prometheus/common/model"
|
2021-11-17 10:57:31 -08:00
|
|
|
|
|
|
|
"github.com/prometheus/prometheus/model/exemplar"
|
Style cleanup of all the changes in sparsehistogram so far
A lot of this code was hacked together, literally during a
hackathon. This commit intends not to change the code substantially,
but just make the code obey the usual style practices.
A (possibly incomplete) list of areas:
* Generally address linter warnings.
* The `pgk` directory is deprecated as per dev-summit. No new packages should
be added to it. I moved the new `pkg/histogram` package to `model`
anticipating what's proposed in #9478.
* Make the naming of the Sparse Histogram more consistent. Including
abbreviations, there were just too many names for it: SparseHistogram,
Histogram, Histo, hist, his, shs, h. The idea is to call it "Histogram" in
general. Only add "Sparse" if it is needed to avoid confusion with
conventional Histograms (which is rare because the TSDB really has no notion
of conventional Histograms). Use abbreviations only in local scope, and then
really abbreviate (not just removing three out of seven letters like in
"Histo"). This is in the spirit of
https://github.com/golang/go/wiki/CodeReviewComments#variable-names
* Several other minor name changes.
* A lot of formatting of doc comments. For one, following
https://github.com/golang/go/wiki/CodeReviewComments#comment-sentences
, but also layout question, anticipating how things will look like
when rendered by `godoc` (even where `godoc` doesn't render them
right now because they are for unexported types or not a doc comment
at all but just a normal code comment - consistency is queen!).
* Re-enabled `TestQueryLog` and `TestEndopints` (they pass now,
leaving them disabled was presumably an oversight).
* Bucket iterator for histogram.Histogram is now created with a
method.
* HistogramChunk.iterator now allows iterator recycling. (I think
@dieterbe only commented it out because he was confused by the
question in the comment.)
* HistogramAppender.Append panics now because we decided to treat
staleness marker differently.
Signed-off-by: beorn7 <beorn@grafana.com>
2021-10-09 06:57:07 -07:00
|
|
|
"github.com/prometheus/prometheus/model/histogram"
|
2021-11-17 10:57:31 -08:00
|
|
|
"github.com/prometheus/prometheus/model/labels"
|
2021-06-29 14:45:23 -07:00
|
|
|
|
|
|
|
dto "github.com/prometheus/prometheus/prompb/io/prometheus/client"
|
|
|
|
)
|
|
|
|
|
2024-10-15 08:28:56 -07:00
|
|
|
// floatFormatBufPool is exclusively used in formatOpenMetricsFloat.
|
|
|
|
var floatFormatBufPool = sync.Pool{
|
|
|
|
New: func() interface{} {
|
|
|
|
// To contain at most 17 digits and additional syntax for a float64.
|
|
|
|
b := make([]byte, 0, 24)
|
|
|
|
return &b
|
|
|
|
},
|
|
|
|
}
|
|
|
|
|
2025-02-13 02:38:35 -08:00
|
|
|
// ProtobufParser parses the old Prometheus protobuf format and present it
|
|
|
|
// as the text-style textparse.Parser interface.
|
|
|
|
//
|
|
|
|
// It uses a tailored streaming protobuf dto.MetricStreamingDecoder that
|
|
|
|
// reuses internal protobuf structs and allows direct unmarshalling to Prometheus
|
|
|
|
// types like labels.
|
2021-06-29 14:45:23 -07:00
|
|
|
type ProtobufParser struct {
|
2025-02-13 02:38:35 -08:00
|
|
|
dec *dto.MetricStreamingDecoder
|
|
|
|
|
|
|
|
// Used for both the string returned by Series and Histogram, as well as,
|
|
|
|
// metric family for Type, Unit and Help.
|
|
|
|
entryBytes *bytes.Buffer
|
|
|
|
|
|
|
|
lset labels.Labels
|
|
|
|
builder labels.ScratchBuilder // Held here to reduce allocations when building Labels.
|
|
|
|
|
2021-07-13 11:01:44 -07:00
|
|
|
// fieldPos is the position within a Summary or (legacy) Histogram. -2
|
2025-02-13 02:38:35 -08:00
|
|
|
// is the count. -1 is the sum. Otherwise, it is the index within
|
2021-07-13 11:01:44 -07:00
|
|
|
// quantiles/buckets.
|
2023-05-10 16:59:21 -07:00
|
|
|
fieldPos int
|
|
|
|
fieldsDone bool // true if no more fields of a Summary or (legacy) Histogram to be processed.
|
2023-07-12 09:42:02 -07:00
|
|
|
redoClassic bool // true after parsing a native histogram if we need to parse it again as a classic histogram.
|
2024-02-14 08:24:40 -08:00
|
|
|
// exemplarPos is the position within the exemplars slice of a native histogram.
|
|
|
|
exemplarPos int
|
2023-05-10 16:59:21 -07:00
|
|
|
|
2023-08-22 12:03:54 -07:00
|
|
|
// exemplarReturned is set to true each time an exemplar has been
|
|
|
|
// returned, and set back to false upon each Next() call.
|
|
|
|
exemplarReturned bool
|
|
|
|
|
2021-07-13 11:01:44 -07:00
|
|
|
// state is marked by the entry we are processing. EntryInvalid implies
|
|
|
|
// that we have to decode the next MetricFamily.
|
|
|
|
state Entry
|
|
|
|
|
2024-08-27 20:26:57 -07:00
|
|
|
// Whether to also parse a classic histogram that is also present as a
|
2023-05-10 16:59:21 -07:00
|
|
|
// native histogram.
|
|
|
|
parseClassicHistograms bool
|
2021-06-29 14:45:23 -07:00
|
|
|
}
|
|
|
|
|
Style cleanup of all the changes in sparsehistogram so far
A lot of this code was hacked together, literally during a
hackathon. This commit intends not to change the code substantially,
but just make the code obey the usual style practices.
A (possibly incomplete) list of areas:
* Generally address linter warnings.
* The `pgk` directory is deprecated as per dev-summit. No new packages should
be added to it. I moved the new `pkg/histogram` package to `model`
anticipating what's proposed in #9478.
* Make the naming of the Sparse Histogram more consistent. Including
abbreviations, there were just too many names for it: SparseHistogram,
Histogram, Histo, hist, his, shs, h. The idea is to call it "Histogram" in
general. Only add "Sparse" if it is needed to avoid confusion with
conventional Histograms (which is rare because the TSDB really has no notion
of conventional Histograms). Use abbreviations only in local scope, and then
really abbreviate (not just removing three out of seven letters like in
"Histo"). This is in the spirit of
https://github.com/golang/go/wiki/CodeReviewComments#variable-names
* Several other minor name changes.
* A lot of formatting of doc comments. For one, following
https://github.com/golang/go/wiki/CodeReviewComments#comment-sentences
, but also layout question, anticipating how things will look like
when rendered by `godoc` (even where `godoc` doesn't render them
right now because they are for unexported types or not a doc comment
at all but just a normal code comment - consistency is queen!).
* Re-enabled `TestQueryLog` and `TestEndopints` (they pass now,
leaving them disabled was presumably an oversight).
* Bucket iterator for histogram.Histogram is now created with a
method.
* HistogramChunk.iterator now allows iterator recycling. (I think
@dieterbe only commented it out because he was confused by the
question in the comment.)
* HistogramAppender.Append panics now because we decided to treat
staleness marker differently.
Signed-off-by: beorn7 <beorn@grafana.com>
2021-10-09 06:57:07 -07:00
|
|
|
// NewProtobufParser returns a parser for the payload in the byte slice.
|
2023-03-25 06:31:24 -07:00
|
|
|
func NewProtobufParser(b []byte, parseClassicHistograms bool, st *labels.SymbolTable) Parser {
|
2021-06-29 14:45:23 -07:00
|
|
|
return &ProtobufParser{
|
2025-02-13 02:38:35 -08:00
|
|
|
dec: dto.NewMetricStreamingDecoder(b),
|
|
|
|
entryBytes: &bytes.Buffer{},
|
|
|
|
builder: labels.NewScratchBuilderWithSymbolTable(st, 16), // TODO(bwplotka): Try base builder.
|
|
|
|
|
2023-05-10 16:59:21 -07:00
|
|
|
state: EntryInvalid,
|
|
|
|
parseClassicHistograms: parseClassicHistograms,
|
2021-06-29 14:45:23 -07:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Series returns the bytes of a series with a simple float64 as a
|
|
|
|
// value, the timestamp if set, and the value of the current sample.
|
|
|
|
func (p *ProtobufParser) Series() ([]byte, *int64, float64) {
|
|
|
|
var (
|
2025-02-13 02:38:35 -08:00
|
|
|
ts = &p.dec.TimestampMs // To save memory allocations, never nil.
|
2021-06-29 14:45:23 -07:00
|
|
|
v float64
|
|
|
|
)
|
2025-02-13 02:38:35 -08:00
|
|
|
switch p.dec.GetType() {
|
2021-06-29 14:45:23 -07:00
|
|
|
case dto.MetricType_COUNTER:
|
2025-02-13 02:38:35 -08:00
|
|
|
v = p.dec.GetCounter().GetValue()
|
2021-06-29 14:45:23 -07:00
|
|
|
case dto.MetricType_GAUGE:
|
2025-02-13 02:38:35 -08:00
|
|
|
v = p.dec.GetGauge().GetValue()
|
2021-06-29 14:45:23 -07:00
|
|
|
case dto.MetricType_UNTYPED:
|
2025-02-13 02:38:35 -08:00
|
|
|
v = p.dec.GetUntyped().GetValue()
|
2021-07-13 11:01:44 -07:00
|
|
|
case dto.MetricType_SUMMARY:
|
2025-02-13 02:38:35 -08:00
|
|
|
s := p.dec.GetSummary()
|
2021-07-13 11:01:44 -07:00
|
|
|
switch p.fieldPos {
|
|
|
|
case -2:
|
|
|
|
v = float64(s.GetSampleCount())
|
|
|
|
case -1:
|
|
|
|
v = s.GetSampleSum()
|
2023-07-18 15:59:41 -07:00
|
|
|
// Need to detect summaries without quantile here.
|
2021-08-30 22:17:57 -07:00
|
|
|
if len(s.GetQuantile()) == 0 {
|
|
|
|
p.fieldsDone = true
|
|
|
|
}
|
2021-07-13 11:01:44 -07:00
|
|
|
default:
|
|
|
|
v = s.GetQuantile()[p.fieldPos].GetValue()
|
|
|
|
}
|
2023-01-05 06:39:10 -08:00
|
|
|
case dto.MetricType_HISTOGRAM, dto.MetricType_GAUGE_HISTOGRAM:
|
2023-05-10 16:59:21 -07:00
|
|
|
// This should only happen for a classic histogram.
|
2025-02-13 02:38:35 -08:00
|
|
|
h := p.dec.GetHistogram()
|
2021-07-13 11:01:44 -07:00
|
|
|
switch p.fieldPos {
|
|
|
|
case -2:
|
2023-05-10 16:59:21 -07:00
|
|
|
v = h.GetSampleCountFloat()
|
|
|
|
if v == 0 {
|
|
|
|
v = float64(h.GetSampleCount())
|
|
|
|
}
|
2021-07-13 11:01:44 -07:00
|
|
|
case -1:
|
|
|
|
v = h.GetSampleSum()
|
|
|
|
default:
|
|
|
|
bb := h.GetBucket()
|
|
|
|
if p.fieldPos >= len(bb) {
|
2023-05-10 16:59:21 -07:00
|
|
|
v = h.GetSampleCountFloat()
|
|
|
|
if v == 0 {
|
|
|
|
v = float64(h.GetSampleCount())
|
|
|
|
}
|
2021-07-13 11:01:44 -07:00
|
|
|
} else {
|
2023-05-10 16:59:21 -07:00
|
|
|
v = bb[p.fieldPos].GetCumulativeCountFloat()
|
|
|
|
if v == 0 {
|
|
|
|
v = float64(bb[p.fieldPos].GetCumulativeCount())
|
|
|
|
}
|
2021-07-13 11:01:44 -07:00
|
|
|
}
|
|
|
|
}
|
2021-06-29 14:45:23 -07:00
|
|
|
default:
|
|
|
|
panic("encountered unexpected metric type, this is a bug")
|
|
|
|
}
|
2025-02-13 02:38:35 -08:00
|
|
|
if *ts != 0 {
|
|
|
|
return p.entryBytes.Bytes(), ts, v
|
2021-06-29 14:45:23 -07:00
|
|
|
}
|
2023-10-19 08:54:42 -07:00
|
|
|
// TODO(beorn7): We assume here that ts==0 means no timestamp. That's
|
|
|
|
// not true in general, but proto3 originally has no distinction between
|
|
|
|
// unset and default. At a later stage, the `optional` keyword was
|
|
|
|
// (re-)introduced in proto3, but gogo-protobuf never got updated to
|
|
|
|
// support it. (Note that setting `[(gogoproto.nullable) = true]` for
|
|
|
|
// the `timestamp_ms` field doesn't help, either.) We plan to migrate
|
|
|
|
// away from gogo-protobuf to an actively maintained protobuf
|
|
|
|
// implementation. Once that's done, we can simply use the `optional`
|
|
|
|
// keyword and check for the unset state explicitly.
|
2025-02-13 02:38:35 -08:00
|
|
|
return p.entryBytes.Bytes(), nil, v
|
2021-06-29 14:45:23 -07:00
|
|
|
}
|
|
|
|
|
histograms: Add Compact method to the normal integer Histogram
And use the new method to call to compact Histograms during
parsing. This happens for both `Histogram` and `FloatHistogram`. In
this way, if targets decide to optimize the exposition size by merging
spans with empty buckets in between, we still get a normalized
results. It will also normalize away any valid but weird
representations like empty spans, spans with offset zero, and empty
buckets at the start or end of a span.
The implementation seemed easy at first as it just turns the
`compactBuckets` helper into a generic function (which now got its own
file). However, the integer Histograms have delta buckets instead of
absolute buckets, which had to be treated specially in the generic
`compactBuckets` function. To make sure it works, I have added plenty
of explicit tests for `Histogram` in addition to the `FloatHistogram`
tests.
I have also updated the doc comment for the `Compact` method.
Based on the insights now expressed in the doc comment, compacting
with a maxEmptyBuckets > 0 is rarely useful. Therefore, this commit
also sets the value to 0 in the two cases we were using 3 so far. We
might still want to reconsider, so I don't want to remove the
maxEmptyBuckets parameter right now.
Signed-off-by: beorn7 <beorn@grafana.com>
2022-09-27 04:04:16 -07:00
|
|
|
// Histogram returns the bytes of a series with a native histogram as a value,
|
|
|
|
// the timestamp if set, and the native histogram in the current sample.
|
|
|
|
//
|
|
|
|
// The Compact method is called before returning the Histogram (or FloatHistogram).
|
|
|
|
//
|
|
|
|
// If the SampleCountFloat or the ZeroCountFloat in the proto message is > 0,
|
|
|
|
// the histogram is parsed and returned as a FloatHistogram and nil is returned
|
|
|
|
// as the (integer) Histogram return value. Otherwise, it is parsed and returned
|
|
|
|
// as an (integer) Histogram and nil is returned as the FloatHistogram return
|
|
|
|
// value.
|
2022-08-25 08:07:41 -07:00
|
|
|
func (p *ProtobufParser) Histogram() ([]byte, *int64, *histogram.Histogram, *histogram.FloatHistogram) {
|
2021-06-29 14:45:23 -07:00
|
|
|
var (
|
2025-02-13 02:38:35 -08:00
|
|
|
ts = &p.dec.TimestampMs // To save memory allocations, never nil.
|
|
|
|
h = p.dec.GetHistogram()
|
2021-06-29 14:45:23 -07:00
|
|
|
)
|
2025-02-13 02:38:35 -08:00
|
|
|
|
2023-05-10 16:59:21 -07:00
|
|
|
if p.parseClassicHistograms && len(h.GetBucket()) > 0 {
|
|
|
|
p.redoClassic = true
|
|
|
|
}
|
2022-08-25 08:07:41 -07:00
|
|
|
if h.GetSampleCountFloat() > 0 || h.GetZeroCountFloat() > 0 {
|
|
|
|
// It is a float histogram.
|
|
|
|
fh := histogram.FloatHistogram{
|
2025-02-13 02:38:35 -08:00
|
|
|
Count: h.GetSampleCountFloat(),
|
|
|
|
Sum: h.GetSampleSum(),
|
|
|
|
ZeroThreshold: h.GetZeroThreshold(),
|
|
|
|
ZeroCount: h.GetZeroCountFloat(),
|
|
|
|
Schema: h.GetSchema(),
|
|
|
|
|
|
|
|
// Decoder reuses slices, so we need to copy.
|
2022-08-25 08:07:41 -07:00
|
|
|
PositiveSpans: make([]histogram.Span, len(h.GetPositiveSpan())),
|
2025-02-13 02:38:35 -08:00
|
|
|
PositiveBuckets: make([]float64, len(h.GetPositiveCount())),
|
2022-08-25 08:07:41 -07:00
|
|
|
NegativeSpans: make([]histogram.Span, len(h.GetNegativeSpan())),
|
2025-02-13 02:38:35 -08:00
|
|
|
NegativeBuckets: make([]float64, len(h.GetNegativeCount())),
|
2022-08-25 08:07:41 -07:00
|
|
|
}
|
|
|
|
for i, span := range h.GetPositiveSpan() {
|
|
|
|
fh.PositiveSpans[i].Offset = span.GetOffset()
|
|
|
|
fh.PositiveSpans[i].Length = span.GetLength()
|
|
|
|
}
|
2025-02-13 02:38:35 -08:00
|
|
|
for i, cnt := range h.GetPositiveCount() {
|
|
|
|
fh.PositiveBuckets[i] = cnt
|
|
|
|
}
|
2022-08-25 08:07:41 -07:00
|
|
|
for i, span := range h.GetNegativeSpan() {
|
|
|
|
fh.NegativeSpans[i].Offset = span.GetOffset()
|
|
|
|
fh.NegativeSpans[i].Length = span.GetLength()
|
|
|
|
}
|
2025-02-13 02:38:35 -08:00
|
|
|
for i, cnt := range h.GetNegativeCount() {
|
|
|
|
fh.NegativeBuckets[i] = cnt
|
|
|
|
}
|
|
|
|
if p.dec.GetType() == dto.MetricType_GAUGE_HISTOGRAM {
|
2023-01-10 07:25:23 -08:00
|
|
|
fh.CounterResetHint = histogram.GaugeType
|
|
|
|
}
|
histograms: Add Compact method to the normal integer Histogram
And use the new method to call to compact Histograms during
parsing. This happens for both `Histogram` and `FloatHistogram`. In
this way, if targets decide to optimize the exposition size by merging
spans with empty buckets in between, we still get a normalized
results. It will also normalize away any valid but weird
representations like empty spans, spans with offset zero, and empty
buckets at the start or end of a span.
The implementation seemed easy at first as it just turns the
`compactBuckets` helper into a generic function (which now got its own
file). However, the integer Histograms have delta buckets instead of
absolute buckets, which had to be treated specially in the generic
`compactBuckets` function. To make sure it works, I have added plenty
of explicit tests for `Histogram` in addition to the `FloatHistogram`
tests.
I have also updated the doc comment for the `Compact` method.
Based on the insights now expressed in the doc comment, compacting
with a maxEmptyBuckets > 0 is rarely useful. Therefore, this commit
also sets the value to 0 in the two cases we were using 3 so far. We
might still want to reconsider, so I don't want to remove the
maxEmptyBuckets parameter right now.
Signed-off-by: beorn7 <beorn@grafana.com>
2022-09-27 04:04:16 -07:00
|
|
|
fh.Compact(0)
|
2025-02-13 02:38:35 -08:00
|
|
|
if *ts != 0 {
|
|
|
|
return p.entryBytes.Bytes(), ts, nil, &fh
|
2022-08-25 08:07:41 -07:00
|
|
|
}
|
|
|
|
// Nasty hack: Assume that ts==0 means no timestamp. That's not true in
|
|
|
|
// general, but proto3 has no distinction between unset and
|
|
|
|
// default. Need to avoid in the final format.
|
2025-02-13 02:38:35 -08:00
|
|
|
return p.entryBytes.Bytes(), nil, nil, &fh
|
2022-08-25 08:07:41 -07:00
|
|
|
}
|
|
|
|
|
2025-02-13 02:38:35 -08:00
|
|
|
// TODO(bwplotka): Create sync.Pool for those structs.
|
Style cleanup of all the changes in sparsehistogram so far
A lot of this code was hacked together, literally during a
hackathon. This commit intends not to change the code substantially,
but just make the code obey the usual style practices.
A (possibly incomplete) list of areas:
* Generally address linter warnings.
* The `pgk` directory is deprecated as per dev-summit. No new packages should
be added to it. I moved the new `pkg/histogram` package to `model`
anticipating what's proposed in #9478.
* Make the naming of the Sparse Histogram more consistent. Including
abbreviations, there were just too many names for it: SparseHistogram,
Histogram, Histo, hist, his, shs, h. The idea is to call it "Histogram" in
general. Only add "Sparse" if it is needed to avoid confusion with
conventional Histograms (which is rare because the TSDB really has no notion
of conventional Histograms). Use abbreviations only in local scope, and then
really abbreviate (not just removing three out of seven letters like in
"Histo"). This is in the spirit of
https://github.com/golang/go/wiki/CodeReviewComments#variable-names
* Several other minor name changes.
* A lot of formatting of doc comments. For one, following
https://github.com/golang/go/wiki/CodeReviewComments#comment-sentences
, but also layout question, anticipating how things will look like
when rendered by `godoc` (even where `godoc` doesn't render them
right now because they are for unexported types or not a doc comment
at all but just a normal code comment - consistency is queen!).
* Re-enabled `TestQueryLog` and `TestEndopints` (they pass now,
leaving them disabled was presumably an oversight).
* Bucket iterator for histogram.Histogram is now created with a
method.
* HistogramChunk.iterator now allows iterator recycling. (I think
@dieterbe only commented it out because he was confused by the
question in the comment.)
* HistogramAppender.Append panics now because we decided to treat
staleness marker differently.
Signed-off-by: beorn7 <beorn@grafana.com>
2021-10-09 06:57:07 -07:00
|
|
|
sh := histogram.Histogram{
|
2021-06-29 14:45:23 -07:00
|
|
|
Count: h.GetSampleCount(),
|
|
|
|
Sum: h.GetSampleSum(),
|
2022-07-19 09:11:33 -07:00
|
|
|
ZeroThreshold: h.GetZeroThreshold(),
|
|
|
|
ZeroCount: h.GetZeroCount(),
|
|
|
|
Schema: h.GetSchema(),
|
|
|
|
PositiveSpans: make([]histogram.Span, len(h.GetPositiveSpan())),
|
2025-02-13 02:38:35 -08:00
|
|
|
PositiveBuckets: make([]int64, len(h.GetPositiveDelta())),
|
2022-07-19 09:11:33 -07:00
|
|
|
NegativeSpans: make([]histogram.Span, len(h.GetNegativeSpan())),
|
2025-02-13 02:38:35 -08:00
|
|
|
NegativeBuckets: make([]int64, len(h.GetNegativeDelta())),
|
2021-06-29 14:45:23 -07:00
|
|
|
}
|
2022-07-19 09:11:33 -07:00
|
|
|
for i, span := range h.GetPositiveSpan() {
|
2021-06-29 14:45:23 -07:00
|
|
|
sh.PositiveSpans[i].Offset = span.GetOffset()
|
|
|
|
sh.PositiveSpans[i].Length = span.GetLength()
|
|
|
|
}
|
2025-02-13 02:38:35 -08:00
|
|
|
for i, cnt := range h.GetPositiveDelta() {
|
|
|
|
sh.PositiveBuckets[i] = cnt
|
|
|
|
}
|
2022-07-19 09:11:33 -07:00
|
|
|
for i, span := range h.GetNegativeSpan() {
|
2021-06-29 14:45:23 -07:00
|
|
|
sh.NegativeSpans[i].Offset = span.GetOffset()
|
|
|
|
sh.NegativeSpans[i].Length = span.GetLength()
|
|
|
|
}
|
2025-02-13 02:38:35 -08:00
|
|
|
for i, cnt := range h.GetNegativeDelta() {
|
|
|
|
sh.NegativeBuckets[i] = cnt
|
|
|
|
}
|
|
|
|
if p.dec.GetType() == dto.MetricType_GAUGE_HISTOGRAM {
|
2023-01-10 07:25:23 -08:00
|
|
|
sh.CounterResetHint = histogram.GaugeType
|
|
|
|
}
|
histograms: Add Compact method to the normal integer Histogram
And use the new method to call to compact Histograms during
parsing. This happens for both `Histogram` and `FloatHistogram`. In
this way, if targets decide to optimize the exposition size by merging
spans with empty buckets in between, we still get a normalized
results. It will also normalize away any valid but weird
representations like empty spans, spans with offset zero, and empty
buckets at the start or end of a span.
The implementation seemed easy at first as it just turns the
`compactBuckets` helper into a generic function (which now got its own
file). However, the integer Histograms have delta buckets instead of
absolute buckets, which had to be treated specially in the generic
`compactBuckets` function. To make sure it works, I have added plenty
of explicit tests for `Histogram` in addition to the `FloatHistogram`
tests.
I have also updated the doc comment for the `Compact` method.
Based on the insights now expressed in the doc comment, compacting
with a maxEmptyBuckets > 0 is rarely useful. Therefore, this commit
also sets the value to 0 in the two cases we were using 3 so far. We
might still want to reconsider, so I don't want to remove the
maxEmptyBuckets parameter right now.
Signed-off-by: beorn7 <beorn@grafana.com>
2022-09-27 04:04:16 -07:00
|
|
|
sh.Compact(0)
|
2025-02-13 02:38:35 -08:00
|
|
|
if *ts != 0 {
|
|
|
|
return p.entryBytes.Bytes(), ts, &sh, nil
|
2021-06-29 14:45:23 -07:00
|
|
|
}
|
2025-02-13 02:38:35 -08:00
|
|
|
return p.entryBytes.Bytes(), nil, &sh, nil
|
2021-06-29 14:45:23 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
// Help returns the metric name and help text in the current entry.
|
|
|
|
// Must only be called after Next returned a help entry.
|
|
|
|
// The returned byte slices become invalid after the next call to Next.
|
|
|
|
func (p *ProtobufParser) Help() ([]byte, []byte) {
|
2025-02-13 02:38:35 -08:00
|
|
|
return p.entryBytes.Bytes(), yoloBytes(p.dec.GetHelp())
|
2021-06-29 14:45:23 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
// Type returns the metric name and type in the current entry.
|
|
|
|
// Must only be called after Next returned a type entry.
|
|
|
|
// The returned byte slices become invalid after the next call to Next.
|
2023-11-22 06:39:21 -08:00
|
|
|
func (p *ProtobufParser) Type() ([]byte, model.MetricType) {
|
2025-02-13 02:38:35 -08:00
|
|
|
n := p.entryBytes.Bytes()
|
|
|
|
switch p.dec.GetType() {
|
2021-06-29 14:45:23 -07:00
|
|
|
case dto.MetricType_COUNTER:
|
2023-11-22 06:39:21 -08:00
|
|
|
return n, model.MetricTypeCounter
|
2021-06-29 14:45:23 -07:00
|
|
|
case dto.MetricType_GAUGE:
|
2023-11-22 06:39:21 -08:00
|
|
|
return n, model.MetricTypeGauge
|
2021-06-29 14:45:23 -07:00
|
|
|
case dto.MetricType_HISTOGRAM:
|
2023-11-22 06:39:21 -08:00
|
|
|
return n, model.MetricTypeHistogram
|
2023-01-05 06:39:10 -08:00
|
|
|
case dto.MetricType_GAUGE_HISTOGRAM:
|
2023-11-22 06:39:21 -08:00
|
|
|
return n, model.MetricTypeGaugeHistogram
|
2021-07-13 11:01:44 -07:00
|
|
|
case dto.MetricType_SUMMARY:
|
2023-11-22 06:39:21 -08:00
|
|
|
return n, model.MetricTypeSummary
|
2021-06-29 14:45:23 -07:00
|
|
|
}
|
2023-11-22 06:39:21 -08:00
|
|
|
return n, model.MetricTypeUnknown
|
2021-06-29 14:45:23 -07:00
|
|
|
}
|
|
|
|
|
2023-12-14 08:00:52 -08:00
|
|
|
// Unit returns the metric unit in the current entry.
|
|
|
|
// Must only be called after Next returned a unit entry.
|
|
|
|
// The returned byte slices become invalid after the next call to Next.
|
2021-06-29 14:45:23 -07:00
|
|
|
func (p *ProtobufParser) Unit() ([]byte, []byte) {
|
2025-02-13 02:38:35 -08:00
|
|
|
return p.entryBytes.Bytes(), []byte(p.dec.GetUnit())
|
2021-06-29 14:45:23 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
// Comment always returns nil because comments aren't supported by the protobuf
|
|
|
|
// format.
|
|
|
|
func (p *ProtobufParser) Comment() []byte {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2025-02-12 07:47:56 -08:00
|
|
|
// Labels writes the labels of the current sample into the passed labels.
|
|
|
|
func (p *ProtobufParser) Labels(l *labels.Labels) {
|
2025-02-13 02:38:35 -08:00
|
|
|
*l = p.lset.Copy()
|
2021-06-29 14:45:23 -07:00
|
|
|
}
|
|
|
|
|
2021-07-13 06:11:26 -07:00
|
|
|
// Exemplar writes the exemplar of the current sample into the passed
|
2022-07-19 09:11:33 -07:00
|
|
|
// exemplar. It returns if an exemplar exists or not. In case of a native
|
2024-02-14 08:24:40 -08:00
|
|
|
// histogram, the exemplars in the native histogram will be returned.
|
|
|
|
// If this field is empty, the classic bucket section is still used for exemplars.
|
|
|
|
// To ingest all exemplars, call the Exemplar method repeatedly until it returns false.
|
2021-07-13 06:11:26 -07:00
|
|
|
func (p *ProtobufParser) Exemplar(ex *exemplar.Exemplar) bool {
|
2023-08-22 12:03:54 -07:00
|
|
|
if p.exemplarReturned && p.state == EntrySeries {
|
|
|
|
// We only ever return one exemplar per (non-native-histogram) series.
|
|
|
|
return false
|
|
|
|
}
|
2021-07-13 06:11:26 -07:00
|
|
|
var exProto *dto.Exemplar
|
2025-02-13 02:38:35 -08:00
|
|
|
switch p.dec.GetType() {
|
2021-07-13 06:11:26 -07:00
|
|
|
case dto.MetricType_COUNTER:
|
2025-02-13 02:38:35 -08:00
|
|
|
exProto = p.dec.GetCounter().GetExemplar()
|
2023-01-05 06:39:10 -08:00
|
|
|
case dto.MetricType_HISTOGRAM, dto.MetricType_GAUGE_HISTOGRAM:
|
2023-11-16 06:07:37 -08:00
|
|
|
isClassic := p.state == EntrySeries
|
2025-02-13 02:38:35 -08:00
|
|
|
if !isClassic && len(p.dec.GetHistogram().GetExemplars()) > 0 {
|
|
|
|
exs := p.dec.GetHistogram().GetExemplars()
|
2024-02-14 08:24:40 -08:00
|
|
|
for p.exemplarPos < len(exs) {
|
|
|
|
exProto = exs[p.exemplarPos]
|
|
|
|
p.exemplarPos++
|
|
|
|
if exProto != nil && exProto.GetTimestamp() != nil {
|
|
|
|
break
|
|
|
|
}
|
2021-07-13 11:01:44 -07:00
|
|
|
}
|
2024-02-14 08:24:40 -08:00
|
|
|
if exProto != nil && exProto.GetTimestamp() == nil {
|
|
|
|
return false
|
2021-07-13 11:01:44 -07:00
|
|
|
}
|
2024-02-14 08:24:40 -08:00
|
|
|
} else {
|
2025-02-13 02:38:35 -08:00
|
|
|
bb := p.dec.GetHistogram().GetBucket()
|
2024-02-14 08:24:40 -08:00
|
|
|
if p.fieldPos < 0 {
|
|
|
|
if isClassic {
|
|
|
|
return false // At _count or _sum.
|
|
|
|
}
|
|
|
|
p.fieldPos = 0 // Start at 1st bucket for native histograms.
|
|
|
|
}
|
|
|
|
for p.fieldPos < len(bb) {
|
|
|
|
exProto = bb[p.fieldPos].GetExemplar()
|
|
|
|
if isClassic {
|
|
|
|
break
|
|
|
|
}
|
|
|
|
p.fieldPos++
|
|
|
|
// We deliberately drop exemplars with no timestamp only for native histograms.
|
|
|
|
if exProto != nil && (isClassic || exProto.GetTimestamp() != nil) {
|
|
|
|
break // Found a classic histogram exemplar or a native histogram exemplar with a timestamp.
|
|
|
|
}
|
|
|
|
}
|
|
|
|
// If the last exemplar for native histograms has no timestamp, ignore it.
|
|
|
|
if !isClassic && exProto.GetTimestamp() == nil {
|
|
|
|
return false
|
2021-07-13 11:01:44 -07:00
|
|
|
}
|
2023-11-16 06:07:37 -08:00
|
|
|
}
|
2021-07-13 06:11:26 -07:00
|
|
|
default:
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
if exProto == nil {
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
ex.Value = exProto.GetValue()
|
|
|
|
if ts := exProto.GetTimestamp(); ts != nil {
|
|
|
|
ex.HasTs = true
|
|
|
|
ex.Ts = ts.GetSeconds()*1000 + int64(ts.GetNanos()/1_000_000)
|
|
|
|
}
|
2022-03-09 14:13:50 -08:00
|
|
|
p.builder.Reset()
|
2021-07-13 06:11:26 -07:00
|
|
|
for _, lp := range exProto.GetLabel() {
|
2022-03-09 14:13:50 -08:00
|
|
|
p.builder.Add(lp.GetName(), lp.GetValue())
|
2021-07-13 06:11:26 -07:00
|
|
|
}
|
2022-03-09 14:13:50 -08:00
|
|
|
p.builder.Sort()
|
|
|
|
ex.Labels = p.builder.Labels()
|
2023-08-22 12:03:54 -07:00
|
|
|
p.exemplarReturned = true
|
2021-07-13 06:11:26 -07:00
|
|
|
return true
|
2021-06-29 14:45:23 -07:00
|
|
|
}
|
|
|
|
|
2023-12-11 00:43:42 -08:00
|
|
|
// CreatedTimestamp returns CT or nil if CT is not present or
|
|
|
|
// invalid (as timestamp e.g. negative value) on counters, summaries or histograms.
|
|
|
|
func (p *ProtobufParser) CreatedTimestamp() *int64 {
|
|
|
|
var ct *types.Timestamp
|
2025-02-13 02:38:35 -08:00
|
|
|
switch p.dec.GetType() {
|
2023-10-18 11:04:02 -07:00
|
|
|
case dto.MetricType_COUNTER:
|
2025-02-13 02:38:35 -08:00
|
|
|
ct = p.dec.GetCounter().GetCreatedTimestamp()
|
2023-10-18 11:04:02 -07:00
|
|
|
case dto.MetricType_SUMMARY:
|
2025-02-13 02:38:35 -08:00
|
|
|
ct = p.dec.GetSummary().GetCreatedTimestamp()
|
2023-10-18 11:04:02 -07:00
|
|
|
case dto.MetricType_HISTOGRAM, dto.MetricType_GAUGE_HISTOGRAM:
|
2025-02-13 02:38:35 -08:00
|
|
|
ct = p.dec.GetHistogram().GetCreatedTimestamp()
|
2023-10-18 11:04:02 -07:00
|
|
|
default:
|
|
|
|
}
|
2023-12-11 00:43:42 -08:00
|
|
|
ctAsTime, err := types.TimestampFromProto(ct)
|
|
|
|
if err != nil {
|
|
|
|
// Errors means ct == nil or invalid timestamp, which we silently ignore.
|
|
|
|
return nil
|
2023-10-18 11:04:02 -07:00
|
|
|
}
|
2023-12-11 00:43:42 -08:00
|
|
|
ctMilis := ctAsTime.UnixMilli()
|
|
|
|
return &ctMilis
|
2023-10-18 11:04:02 -07:00
|
|
|
}
|
|
|
|
|
2021-06-29 14:45:23 -07:00
|
|
|
// Next advances the parser to the next "sample" (emulating the behavior of a
|
|
|
|
// text format parser). It returns (EntryInvalid, io.EOF) if no samples were
|
|
|
|
// read.
|
|
|
|
func (p *ProtobufParser) Next() (Entry, error) {
|
2023-08-22 12:03:54 -07:00
|
|
|
p.exemplarReturned = false
|
2021-06-29 14:45:23 -07:00
|
|
|
switch p.state {
|
2025-02-13 02:38:35 -08:00
|
|
|
// Invalid state occurs on:
|
|
|
|
// * First Next() call.
|
|
|
|
// * Recursive call that tells Next to move to the next metric family.
|
2021-06-29 14:45:23 -07:00
|
|
|
case EntryInvalid:
|
2024-09-02 08:42:48 -07:00
|
|
|
p.exemplarPos = 0
|
2021-07-13 11:01:44 -07:00
|
|
|
p.fieldPos = -2
|
2025-02-13 02:38:35 -08:00
|
|
|
|
|
|
|
if err := p.dec.NextMetricFamily(); err != nil {
|
2021-06-29 14:45:23 -07:00
|
|
|
return p.state, err
|
|
|
|
}
|
2025-02-13 02:38:35 -08:00
|
|
|
if err := p.dec.NextMetric(); err != nil {
|
|
|
|
// Skip empty metric families.
|
|
|
|
if errors.Is(err, io.EOF) {
|
|
|
|
return p.Next()
|
|
|
|
}
|
|
|
|
return EntryInvalid, err
|
2021-06-29 14:45:23 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
// We are at the beginning of a metric family. Put only the name
|
2025-02-13 02:38:35 -08:00
|
|
|
// into entryBytes and validate only name, help, and type for now.
|
|
|
|
name := p.dec.GetName()
|
2021-06-29 14:45:23 -07:00
|
|
|
if !model.IsValidMetricName(model.LabelValue(name)) {
|
2023-11-02 13:45:07 -07:00
|
|
|
return EntryInvalid, fmt.Errorf("invalid metric name: %s", name)
|
2021-06-29 14:45:23 -07:00
|
|
|
}
|
2025-02-13 02:38:35 -08:00
|
|
|
if help := p.dec.GetHelp(); !utf8.ValidString(help) {
|
2023-11-02 13:45:07 -07:00
|
|
|
return EntryInvalid, fmt.Errorf("invalid help for metric %q: %s", name, help)
|
2021-06-29 14:45:23 -07:00
|
|
|
}
|
2025-02-13 02:38:35 -08:00
|
|
|
switch p.dec.GetType() {
|
2023-01-05 06:21:18 -08:00
|
|
|
case dto.MetricType_COUNTER,
|
|
|
|
dto.MetricType_GAUGE,
|
|
|
|
dto.MetricType_HISTOGRAM,
|
2023-01-05 06:39:10 -08:00
|
|
|
dto.MetricType_GAUGE_HISTOGRAM,
|
2023-01-05 06:21:18 -08:00
|
|
|
dto.MetricType_SUMMARY,
|
|
|
|
dto.MetricType_UNTYPED:
|
|
|
|
// All good.
|
|
|
|
default:
|
2025-02-13 02:38:35 -08:00
|
|
|
return EntryInvalid, fmt.Errorf("unknown metric type for metric %q: %s", name, p.dec.GetType())
|
2023-01-05 06:21:18 -08:00
|
|
|
}
|
2025-02-13 02:38:35 -08:00
|
|
|
unit := p.dec.GetUnit()
|
2023-12-14 08:00:52 -08:00
|
|
|
if len(unit) > 0 {
|
2025-02-13 02:38:35 -08:00
|
|
|
if p.dec.GetType() == dto.MetricType_COUNTER && strings.HasSuffix(name, "_total") {
|
2023-12-28 06:41:38 -08:00
|
|
|
if !strings.HasSuffix(name[:len(name)-6], unit) || len(name)-6 < len(unit)+1 || name[len(name)-6-len(unit)-1] != '_' {
|
|
|
|
return EntryInvalid, fmt.Errorf("unit %q not a suffix of counter %q", unit, name)
|
|
|
|
}
|
|
|
|
} else if !strings.HasSuffix(name, unit) || len(name) < len(unit)+1 || name[len(name)-len(unit)-1] != '_' {
|
2023-12-20 00:41:37 -08:00
|
|
|
return EntryInvalid, fmt.Errorf("unit %q not a suffix of metric %q", unit, name)
|
2023-12-14 08:00:52 -08:00
|
|
|
}
|
|
|
|
}
|
2025-02-13 02:38:35 -08:00
|
|
|
p.entryBytes.Reset()
|
|
|
|
p.entryBytes.WriteString(name)
|
2021-06-29 14:45:23 -07:00
|
|
|
p.state = EntryHelp
|
|
|
|
case EntryHelp:
|
2025-02-13 02:38:35 -08:00
|
|
|
if p.dec.Unit != "" {
|
2024-10-07 04:17:44 -07:00
|
|
|
p.state = EntryUnit
|
|
|
|
} else {
|
|
|
|
p.state = EntryType
|
|
|
|
}
|
|
|
|
case EntryUnit:
|
2021-06-29 14:45:23 -07:00
|
|
|
p.state = EntryType
|
|
|
|
case EntryType:
|
2025-02-13 02:38:35 -08:00
|
|
|
t := p.dec.GetType()
|
2023-01-05 06:39:10 -08:00
|
|
|
if (t == dto.MetricType_HISTOGRAM || t == dto.MetricType_GAUGE_HISTOGRAM) &&
|
2025-02-13 02:38:35 -08:00
|
|
|
isNativeHistogram(p.dec.GetHistogram()) {
|
2021-06-29 14:45:23 -07:00
|
|
|
p.state = EntryHistogram
|
|
|
|
} else {
|
|
|
|
p.state = EntrySeries
|
|
|
|
}
|
2025-02-13 02:38:35 -08:00
|
|
|
if err := p.onSeriesOrHistogramUpdate(); err != nil {
|
2021-06-29 14:45:23 -07:00
|
|
|
return EntryInvalid, err
|
|
|
|
}
|
2025-02-13 02:38:35 -08:00
|
|
|
case EntrySeries:
|
|
|
|
// Potentially a second series in the metric family.
|
|
|
|
t := p.dec.GetType()
|
|
|
|
if t == dto.MetricType_SUMMARY ||
|
|
|
|
t == dto.MetricType_HISTOGRAM ||
|
|
|
|
t == dto.MetricType_GAUGE_HISTOGRAM {
|
|
|
|
// Non-trivial series (complex metrics, with magic suffixes).
|
|
|
|
|
|
|
|
// Did we iterate over all the classic representations fields?
|
|
|
|
// NOTE: p.fieldsDone is updated on p.onSeriesOrHistogramUpdate.
|
|
|
|
if !p.fieldsDone {
|
|
|
|
// Still some fields to iterate over.
|
|
|
|
p.fieldPos++
|
|
|
|
if err := p.onSeriesOrHistogramUpdate(); err != nil {
|
|
|
|
return EntryInvalid, err
|
|
|
|
}
|
|
|
|
return p.state, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// Reset histogram fields.
|
2021-07-13 11:01:44 -07:00
|
|
|
p.fieldPos = -2
|
|
|
|
p.fieldsDone = false
|
2024-09-02 08:42:48 -07:00
|
|
|
p.exemplarPos = 0
|
2025-02-13 02:38:35 -08:00
|
|
|
|
2023-07-12 09:42:02 -07:00
|
|
|
// If this is a metric family containing native
|
2025-02-13 02:38:35 -08:00
|
|
|
// histograms, it means we are here thanks to redoClassic state.
|
|
|
|
// Return to native histograms for the consistent flow.
|
|
|
|
if (t == dto.MetricType_HISTOGRAM || t == dto.MetricType_GAUGE_HISTOGRAM) &&
|
|
|
|
isNativeHistogram(p.dec.GetHistogram()) {
|
2023-07-12 09:42:02 -07:00
|
|
|
p.state = EntryHistogram
|
|
|
|
}
|
2021-07-13 11:01:44 -07:00
|
|
|
}
|
2025-02-13 02:38:35 -08:00
|
|
|
// Is there another series?
|
|
|
|
if err := p.dec.NextMetric(); err != nil {
|
|
|
|
if errors.Is(err, io.EOF) {
|
|
|
|
p.state = EntryInvalid
|
|
|
|
return p.Next()
|
|
|
|
}
|
|
|
|
return EntryInvalid, err
|
|
|
|
}
|
|
|
|
if err := p.onSeriesOrHistogramUpdate(); err != nil {
|
|
|
|
return EntryInvalid, err
|
|
|
|
}
|
|
|
|
case EntryHistogram:
|
|
|
|
// Was Histogram() called and parseClassicHistograms is true?
|
|
|
|
if p.redoClassic {
|
|
|
|
p.redoClassic = false
|
|
|
|
p.fieldPos = -3
|
|
|
|
p.fieldsDone = false
|
|
|
|
p.state = EntrySeries
|
|
|
|
return p.Next() // Switch to classic histogram.
|
|
|
|
}
|
|
|
|
|
|
|
|
// Is there another series?
|
|
|
|
if err := p.dec.NextMetric(); err != nil {
|
|
|
|
if errors.Is(err, io.EOF) {
|
|
|
|
p.state = EntryInvalid
|
|
|
|
return p.Next()
|
|
|
|
}
|
|
|
|
return EntryInvalid, err
|
2021-06-29 14:45:23 -07:00
|
|
|
}
|
2025-02-13 02:38:35 -08:00
|
|
|
if err := p.onSeriesOrHistogramUpdate(); err != nil {
|
2021-06-29 14:45:23 -07:00
|
|
|
return EntryInvalid, err
|
|
|
|
}
|
|
|
|
default:
|
2023-11-02 13:45:07 -07:00
|
|
|
return EntryInvalid, fmt.Errorf("invalid protobuf parsing state: %d", p.state)
|
2021-06-29 14:45:23 -07:00
|
|
|
}
|
|
|
|
return p.state, nil
|
|
|
|
}
|
|
|
|
|
2025-02-13 02:38:35 -08:00
|
|
|
// onSeriesOrHistogramUpdate updates internal state before returning
|
|
|
|
// a series or histogram. It updates:
|
|
|
|
// * p.lset.
|
|
|
|
// * p.entryBytes.
|
|
|
|
// * p.fieldsDone depending on p.fieldPos.
|
|
|
|
func (p *ProtobufParser) onSeriesOrHistogramUpdate() error {
|
|
|
|
p.builder.Reset()
|
|
|
|
p.builder.Add(labels.MetricName, p.getMagicName())
|
|
|
|
|
|
|
|
if err := p.dec.Label(&p.builder); err != nil {
|
|
|
|
return err
|
2021-06-29 14:45:23 -07:00
|
|
|
}
|
2025-02-13 02:38:35 -08:00
|
|
|
|
|
|
|
if needed, name, value := p.getMagicLabel(); needed {
|
|
|
|
p.builder.Add(name, value)
|
2021-07-13 11:01:44 -07:00
|
|
|
}
|
2025-02-13 02:38:35 -08:00
|
|
|
|
|
|
|
// Sort labels to maintain the sorted labels invariant.
|
|
|
|
p.builder.Sort()
|
|
|
|
p.builder.Overwrite(&p.lset)
|
|
|
|
|
|
|
|
// entryBytes has to be unique for each series.
|
|
|
|
p.entryBytes.Reset()
|
|
|
|
p.lset.Range(func(l labels.Label) {
|
|
|
|
if l.Name == labels.MetricName {
|
|
|
|
p.entryBytes.WriteString(l.Value)
|
|
|
|
return
|
|
|
|
}
|
|
|
|
p.entryBytes.WriteByte(model.SeparatorByte)
|
|
|
|
p.entryBytes.WriteString(l.Name)
|
|
|
|
p.entryBytes.WriteByte(model.SeparatorByte)
|
|
|
|
p.entryBytes.WriteString(l.Value)
|
|
|
|
})
|
2021-06-29 14:45:23 -07:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2021-07-13 11:01:44 -07:00
|
|
|
// getMagicName usually just returns p.mf.GetType() but adds a magic suffix
|
|
|
|
// ("_count", "_sum", "_bucket") if needed according to the current parser
|
|
|
|
// state.
|
|
|
|
func (p *ProtobufParser) getMagicName() string {
|
2025-02-13 02:38:35 -08:00
|
|
|
t := p.dec.GetType()
|
2023-05-10 16:59:21 -07:00
|
|
|
if p.state == EntryHistogram || (t != dto.MetricType_HISTOGRAM && t != dto.MetricType_GAUGE_HISTOGRAM && t != dto.MetricType_SUMMARY) {
|
2025-02-13 02:38:35 -08:00
|
|
|
return p.dec.GetName()
|
2021-07-13 11:01:44 -07:00
|
|
|
}
|
|
|
|
if p.fieldPos == -2 {
|
2025-02-13 02:38:35 -08:00
|
|
|
return p.dec.GetName() + "_count"
|
2021-07-13 11:01:44 -07:00
|
|
|
}
|
|
|
|
if p.fieldPos == -1 {
|
2025-02-13 02:38:35 -08:00
|
|
|
return p.dec.GetName() + "_sum"
|
2021-07-13 11:01:44 -07:00
|
|
|
}
|
2023-01-05 06:39:10 -08:00
|
|
|
if t == dto.MetricType_HISTOGRAM || t == dto.MetricType_GAUGE_HISTOGRAM {
|
2025-02-13 02:38:35 -08:00
|
|
|
return p.dec.GetName() + "_bucket"
|
2021-07-13 11:01:44 -07:00
|
|
|
}
|
2025-02-13 02:38:35 -08:00
|
|
|
return p.dec.GetName()
|
2021-07-13 11:01:44 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
// getMagicLabel returns if a magic label ("quantile" or "le") is needed and, if
|
|
|
|
// so, its name and value. It also sets p.fieldsDone if applicable.
|
|
|
|
func (p *ProtobufParser) getMagicLabel() (bool, string, string) {
|
2025-02-13 02:38:35 -08:00
|
|
|
// Native histogram or _count and _sum series.
|
2021-07-13 11:01:44 -07:00
|
|
|
if p.state == EntryHistogram || p.fieldPos < 0 {
|
|
|
|
return false, "", ""
|
|
|
|
}
|
2025-02-13 02:38:35 -08:00
|
|
|
switch p.dec.GetType() {
|
2021-07-13 11:01:44 -07:00
|
|
|
case dto.MetricType_SUMMARY:
|
2025-02-13 02:38:35 -08:00
|
|
|
qq := p.dec.GetSummary().GetQuantile()
|
2021-07-13 11:01:44 -07:00
|
|
|
q := qq[p.fieldPos]
|
|
|
|
p.fieldsDone = p.fieldPos == len(qq)-1
|
|
|
|
return true, model.QuantileLabel, formatOpenMetricsFloat(q.GetQuantile())
|
2023-01-05 06:39:10 -08:00
|
|
|
case dto.MetricType_HISTOGRAM, dto.MetricType_GAUGE_HISTOGRAM:
|
2025-02-13 02:38:35 -08:00
|
|
|
bb := p.dec.GetHistogram().GetBucket()
|
2021-07-13 11:01:44 -07:00
|
|
|
if p.fieldPos >= len(bb) {
|
|
|
|
p.fieldsDone = true
|
|
|
|
return true, model.BucketLabel, "+Inf"
|
|
|
|
}
|
|
|
|
b := bb[p.fieldPos]
|
|
|
|
p.fieldsDone = math.IsInf(b.GetUpperBound(), +1)
|
|
|
|
return true, model.BucketLabel, formatOpenMetricsFloat(b.GetUpperBound())
|
|
|
|
}
|
|
|
|
return false, "", ""
|
|
|
|
}
|
|
|
|
|
2024-09-10 13:32:03 -07:00
|
|
|
// formatOpenMetricsFloat works like the usual Go string formatting of a float
|
2021-07-13 11:01:44 -07:00
|
|
|
// but appends ".0" if the resulting number would otherwise contain neither a
|
|
|
|
// "." nor an "e".
|
|
|
|
func formatOpenMetricsFloat(f float64) string {
|
|
|
|
// A few common cases hardcoded.
|
|
|
|
switch {
|
|
|
|
case f == 1:
|
|
|
|
return "1.0"
|
|
|
|
case f == 0:
|
|
|
|
return "0.0"
|
|
|
|
case f == -1:
|
|
|
|
return "-1.0"
|
|
|
|
case math.IsNaN(f):
|
|
|
|
return "NaN"
|
|
|
|
case math.IsInf(f, +1):
|
|
|
|
return "+Inf"
|
|
|
|
case math.IsInf(f, -1):
|
|
|
|
return "-Inf"
|
|
|
|
}
|
2024-10-15 08:28:56 -07:00
|
|
|
bp := floatFormatBufPool.Get().(*[]byte)
|
|
|
|
defer floatFormatBufPool.Put(bp)
|
|
|
|
|
|
|
|
*bp = strconv.AppendFloat((*bp)[:0], f, 'g', -1, 64)
|
|
|
|
if bytes.ContainsAny(*bp, "e.") {
|
|
|
|
return string(*bp)
|
2021-07-13 11:01:44 -07:00
|
|
|
}
|
2024-10-15 08:28:56 -07:00
|
|
|
*bp = append(*bp, '.', '0')
|
|
|
|
return string(*bp)
|
2021-07-13 11:01:44 -07:00
|
|
|
}
|
2021-07-19 10:58:04 -07:00
|
|
|
|
2023-07-20 08:29:31 -07:00
|
|
|
// isNativeHistogram returns false iff the provided histograms has no spans at
|
|
|
|
// all (neither positive nor negative) and a zero threshold of 0 and a zero
|
|
|
|
// count of 0. In principle, this could still be meant to be a native histogram
|
|
|
|
// with a zero threshold of 0 and no observations yet. In that case,
|
|
|
|
// instrumentation libraries should add a "no-op" span (e.g. length zero, offset
|
|
|
|
// zero) to signal that the histogram is meant to be parsed as a native
|
|
|
|
// histogram. Failing to do so will cause Prometheus to parse it as a classic
|
|
|
|
// histogram as long as no observations have happened.
|
2022-07-19 09:11:33 -07:00
|
|
|
func isNativeHistogram(h *dto.Histogram) bool {
|
2023-07-20 08:29:31 -07:00
|
|
|
return len(h.GetPositiveSpan()) > 0 ||
|
|
|
|
len(h.GetNegativeSpan()) > 0 ||
|
|
|
|
h.GetZeroThreshold() > 0 ||
|
|
|
|
h.GetZeroCount() > 0
|
2021-07-19 10:58:04 -07:00
|
|
|
}
|