From a632c73352a7e39d60b445700beb47d691549c3e Mon Sep 17 00:00:00 2001 From: Ganesh Vernekar <15064823+codesome@users.noreply.github.com> Date: Fri, 8 Jul 2022 18:53:23 +0530 Subject: [PATCH] Simplify how OutOfOrderTimeWindow works (#285) * Simplify how OutOfOrderTimeWindow works Signed-off-by: Ganesh Vernekar * Update test Signed-off-by: Ganesh Vernekar --- cmd/prometheus/main.go | 10 ------- tsdb/db.go | 3 +++ tsdb/db_test.go | 16 ++++++++--- tsdb/head_append.go | 61 +++++++++++++++++++----------------------- 4 files changed, 43 insertions(+), 47 deletions(-) diff --git a/cmd/prometheus/main.go b/cmd/prometheus/main.go index f3a7cf3314..5c28371d2e 100644 --- a/cmd/prometheus/main.go +++ b/cmd/prometheus/main.go @@ -314,12 +314,6 @@ func main() { serverOnlyFlag(a, "storage.tsdb.wal-compression", "Compress the tsdb WAL."). Hidden().Default("true").BoolVar(&cfg.tsdb.WALCompression) - serverOnlyFlag(a, "storage.tsdb.out-of-order-cap-min", "Minimum capacity for out of order chunks (in samples. between 0 and 255.)"). - Hidden().Default("4").IntVar(&cfg.tsdb.OutOfOrderCapMin) - - serverOnlyFlag(a, "storage.tsdb.out-of-order-cap-max", "Maximum capacity for out of order chunks (in samples. between 1 and 255.)"). - Hidden().Default("32").IntVar(&cfg.tsdb.OutOfOrderCapMax) - serverOnlyFlag(a, "storage.tsdb.head-chunks-write-queue-size", "Size of the queue through which head chunks are written to the disk to be m-mapped, 0 disables the queue completely. Experimental."). Default("0").IntVar(&cfg.tsdb.HeadChunksWriteQueueSize) @@ -1536,8 +1530,6 @@ type tsdbOptions struct { MinBlockDuration model.Duration MaxBlockDuration model.Duration OutOfOrderTimeWindow int64 - OutOfOrderCapMin int - OutOfOrderCapMax int EnableExemplarStorage bool MaxExemplars int64 EnableMemorySnapshotOnShutdown bool @@ -1561,8 +1553,6 @@ func (opts tsdbOptions) ToTSDBOptions() tsdb.Options { MaxExemplars: opts.MaxExemplars, EnableMemorySnapshotOnShutdown: opts.EnableMemorySnapshotOnShutdown, OutOfOrderTimeWindow: opts.OutOfOrderTimeWindow, - OutOfOrderCapMin: int64(opts.OutOfOrderCapMin), - OutOfOrderCapMax: int64(opts.OutOfOrderCapMax), } } diff --git a/tsdb/db.go b/tsdb/db.go index 450d8cd930..5852125c50 100644 --- a/tsdb/db.go +++ b/tsdb/db.go @@ -671,6 +671,9 @@ func validateOpts(opts *Options, rngs []int64) (*Options, []int64) { if opts.OutOfOrderCapMax <= 0 { opts.OutOfOrderCapMax = DefaultOutOfOrderCapMax } + if opts.OutOfOrderCapMin > opts.OutOfOrderCapMax { + opts.OutOfOrderCapMax = opts.OutOfOrderCapMin + } if opts.OutOfOrderTimeWindow < 0 { opts.OutOfOrderTimeWindow = 0 } diff --git a/tsdb/db_test.go b/tsdb/db_test.go index f230a30b8c..436f0ac10a 100644 --- a/tsdb/db_test.go +++ b/tsdb/db_test.go @@ -4261,8 +4261,18 @@ func TestOOOAppendAndQuery(t *testing.T) { // At the edge of time window, also it would be "out of bound" without the ooo support. addSample(s1, 60, 65, false) - addSample(s2, 50, 55, false) - verifyOOOMinMaxTimes(50, 265) + verifyOOOMinMaxTimes(60, 265) + testQuery() + + // This sample is not within the time window w.r.t. the head's maxt, but it is within the window + // w.r.t. the series' maxt. But we consider only head's maxt. + addSample(s2, 59, 59, true) + verifyOOOMinMaxTimes(60, 265) + testQuery() + + // Now the sample is within time window w.r.t. the head's maxt. + addSample(s2, 60, 65, false) + verifyOOOMinMaxTimes(60, 265) testQuery() // Out of time window again. @@ -4276,7 +4286,7 @@ func TestOOOAppendAndQuery(t *testing.T) { require.Equal(t, float64(4), prom_testutil.ToFloat64(db.head.metrics.chunksCreated)) addSample(s1, 180, 249, false) require.Equal(t, float64(6), prom_testutil.ToFloat64(db.head.metrics.chunksCreated)) - verifyOOOMinMaxTimes(50, 265) + verifyOOOMinMaxTimes(60, 265) testQuery() } diff --git a/tsdb/head_append.go b/tsdb/head_append.go index 6f66b169e1..6aa62083d6 100644 --- a/tsdb/head_append.go +++ b/tsdb/head_append.go @@ -326,49 +326,42 @@ func (a *headAppender) Append(ref storage.SeriesRef, lset labels.Labels, t int64 // The sample belongs to the out of order chunk if we return true and no error. // An error signifies the sample cannot be handled. func (s *memSeries) appendable(t int64, v float64, headMaxt, minValidTime, oooTimeWindow int64) (isOutOfOrder bool, delta int64, err error) { - msMaxt := s.maxTime() - if msMaxt == math.MinInt64 { - // The series has no sample and was freshly created. - if t >= minValidTime { - // We can append it in the in-order chunk. + // Check if we can append in the in-order chunk. + if t >= minValidTime { + if s.head() == nil { + // The series has no sample and was freshly created. return false, 0, nil } - - // We cannot append it in the in-order head. So we check the oooTimeWindow - // w.r.t. the head's maxt. - // -1 because for the first sample in the Head, headMaxt will be equal to t. - msMaxt = headMaxt - 1 - } - - if t > msMaxt { - return false, 0, nil - } - - if t < msMaxt-oooTimeWindow { - if oooTimeWindow > 0 { - return true, msMaxt - t, storage.ErrTooOldSample + msMaxt := s.maxTime() + if t > msMaxt { + return false, 0, nil } - if t < minValidTime { - return false, msMaxt - t, storage.ErrOutOfBounds + if t == msMaxt { + // We are allowing exact duplicates as we can encounter them in valid cases + // like federation and erroring out at that time would be extremely noisy. + // This only checks against the latest in-order sample. + // The OOO headchunk has its own method to detect these duplicates + if math.Float64bits(s.sampleBuf[3].v) != math.Float64bits(v) { + return false, 0, storage.ErrDuplicateSampleForTimestamp + } + // Sample is identical (ts + value) with most current (highest ts) sample in sampleBuf. + return false, 0, nil } - return false, msMaxt - t, storage.ErrOutOfOrderSample } - if t != msMaxt || s.head() == nil { - // Sample is ooo and within time window OR series has no active chunk to check for duplicate sample. - return true, msMaxt - t, nil + // The sample cannot go in the in-order chunk. Check if it can go in the out-of-order chunk. + if oooTimeWindow > 0 && t >= headMaxt-oooTimeWindow { + return true, headMaxt - t, nil } - // We are allowing exact duplicates as we can encounter them in valid cases - // like federation and erroring out at that time would be extremely noisy. - // this only checks against the latest in-order sample. - // the OOO headchunk has its own method to detect these duplicates - if math.Float64bits(s.sampleBuf[3].v) != math.Float64bits(v) { - return false, 0, storage.ErrDuplicateSampleForTimestamp + // The sample cannot go in both in-order and out-of-order chunk. + if oooTimeWindow > 0 { + return true, headMaxt - t, storage.ErrTooOldSample } - - // sample is identical (ts + value) with most current (highest ts) sample in sampleBuf - return false, 0, nil + if t < minValidTime { + return false, headMaxt - t, storage.ErrOutOfBounds + } + return false, headMaxt - t, storage.ErrOutOfOrderSample } // AppendExemplar for headAppender assumes the series ref already exists, and so it doesn't