2017-05-10 02:44:13 -07:00
|
|
|
// Copyright 2013 The Prometheus Authors
|
|
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
// you may not use this file except in compliance with the License.
|
|
|
|
// You may obtain a copy of the License at
|
|
|
|
//
|
|
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
//
|
|
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
// See the License for the specific language governing permissions and
|
|
|
|
// limitations under the License.
|
|
|
|
|
|
|
|
package remote
|
|
|
|
|
|
|
|
import (
|
2018-05-29 01:51:29 -07:00
|
|
|
"context"
|
2017-05-10 02:44:13 -07:00
|
|
|
"fmt"
|
2019-02-13 17:11:17 -08:00
|
|
|
"io/ioutil"
|
|
|
|
"os"
|
2017-10-23 13:28:17 -07:00
|
|
|
"reflect"
|
2017-05-10 02:44:13 -07:00
|
|
|
"sync"
|
|
|
|
"sync/atomic"
|
|
|
|
"testing"
|
|
|
|
"time"
|
|
|
|
|
2018-09-07 14:26:04 -07:00
|
|
|
"github.com/gogo/protobuf/proto"
|
|
|
|
"github.com/golang/snappy"
|
|
|
|
"github.com/stretchr/testify/require"
|
|
|
|
|
2017-05-10 02:44:13 -07:00
|
|
|
"github.com/prometheus/common/model"
|
2017-10-23 06:57:44 -07:00
|
|
|
"github.com/prometheus/prometheus/config"
|
2017-10-23 13:28:17 -07:00
|
|
|
"github.com/prometheus/prometheus/prompb"
|
2018-09-07 14:26:04 -07:00
|
|
|
"github.com/prometheus/prometheus/util/testutil"
|
|
|
|
"github.com/prometheus/tsdb"
|
|
|
|
"github.com/prometheus/tsdb/labels"
|
2017-05-10 02:44:13 -07:00
|
|
|
)
|
|
|
|
|
2018-05-23 07:03:54 -07:00
|
|
|
// defaultFlushDeadline is the flush deadline handed to NewQueueManager by the
// tests in this file that do not pick a deadline of their own.
const defaultFlushDeadline = 1 * time.Minute
|
|
|
|
|
2017-05-10 02:44:13 -07:00
|
|
|
func TestSampleDelivery(t *testing.T) {
|
|
|
|
// Let's create an even number of send batches so we don't run into the
|
|
|
|
// batch timeout case.
|
2017-10-23 06:57:44 -07:00
|
|
|
n := config.DefaultQueueConfig.Capacity * 2
|
2018-09-07 14:26:04 -07:00
|
|
|
samples, series := createTimeseries(n)
|
2017-05-10 02:44:13 -07:00
|
|
|
|
|
|
|
c := NewTestStorageClient()
|
2018-09-07 14:26:04 -07:00
|
|
|
c.expectSamples(samples[:len(samples)/2], series)
|
2017-05-10 02:44:13 -07:00
|
|
|
|
2017-10-23 06:57:44 -07:00
|
|
|
cfg := config.DefaultQueueConfig
|
2018-09-07 14:26:04 -07:00
|
|
|
cfg.BatchSendDeadline = model.Duration(100 * time.Millisecond)
|
2017-05-10 02:44:13 -07:00
|
|
|
cfg.MaxShards = 1
|
2018-09-07 14:26:04 -07:00
|
|
|
var temp int64
|
2019-02-13 17:11:17 -08:00
|
|
|
|
|
|
|
dir, err := ioutil.TempDir("", "TestSampleDeliver")
|
|
|
|
testutil.Ok(t, err)
|
|
|
|
defer os.RemoveAll(dir)
|
|
|
|
|
2019-02-15 01:54:01 -08:00
|
|
|
m := NewQueueManager(nil, dir, newEWMARate(ewmaWeight, shardUpdateDuration), &temp, cfg, nil, nil, c, defaultFlushDeadline)
|
2018-09-07 14:26:04 -07:00
|
|
|
m.seriesLabels = refSeriesToLabelsProto(series)
|
2017-05-10 02:44:13 -07:00
|
|
|
|
|
|
|
// These should be received by the client.
|
|
|
|
m.Start()
|
2018-09-07 14:26:04 -07:00
|
|
|
m.Append(samples[:len(samples)/2])
|
2017-05-10 02:44:13 -07:00
|
|
|
defer m.Stop()
|
|
|
|
|
|
|
|
c.waitForExpectedSamples(t)
|
2018-09-07 14:26:04 -07:00
|
|
|
m.Append(samples[len(samples)/2:])
|
|
|
|
c.expectSamples(samples[len(samples)/2:], series)
|
|
|
|
c.waitForExpectedSamples(t)
|
2017-05-10 02:44:13 -07:00
|
|
|
}
|
|
|
|
|
2018-03-12 08:35:43 -07:00
|
|
|
func TestSampleDeliveryTimeout(t *testing.T) {
|
2018-03-12 09:48:51 -07:00
|
|
|
// Let's send one less sample than batch size, and wait the timeout duration
|
2018-09-07 14:26:04 -07:00
|
|
|
n := 9
|
|
|
|
samples, series := createTimeseries(n)
|
2018-03-12 08:35:43 -07:00
|
|
|
c := NewTestStorageClient()
|
|
|
|
|
|
|
|
cfg := config.DefaultQueueConfig
|
|
|
|
cfg.MaxShards = 1
|
2018-08-24 07:55:21 -07:00
|
|
|
cfg.BatchSendDeadline = model.Duration(100 * time.Millisecond)
|
2018-09-07 14:26:04 -07:00
|
|
|
var temp int64
|
2019-02-13 17:11:17 -08:00
|
|
|
|
|
|
|
dir, err := ioutil.TempDir("", "TestSampleDeliveryTimeout")
|
|
|
|
testutil.Ok(t, err)
|
|
|
|
defer os.RemoveAll(dir)
|
|
|
|
|
2019-02-15 01:54:01 -08:00
|
|
|
m := NewQueueManager(nil, dir, newEWMARate(ewmaWeight, shardUpdateDuration), &temp, cfg, nil, nil, c, defaultFlushDeadline)
|
2018-09-07 14:26:04 -07:00
|
|
|
m.seriesLabels = refSeriesToLabelsProto(series)
|
2018-03-12 08:35:43 -07:00
|
|
|
m.Start()
|
|
|
|
defer m.Stop()
|
|
|
|
|
|
|
|
// Send the samples twice, waiting for the samples in the meantime.
|
2018-09-07 14:26:04 -07:00
|
|
|
c.expectSamples(samples, series)
|
|
|
|
m.Append(samples)
|
2018-03-12 08:35:43 -07:00
|
|
|
c.waitForExpectedSamples(t)
|
|
|
|
|
2018-09-07 14:26:04 -07:00
|
|
|
c.expectSamples(samples, series)
|
|
|
|
m.Append(samples)
|
2018-03-12 08:35:43 -07:00
|
|
|
c.waitForExpectedSamples(t)
|
|
|
|
}
|
|
|
|
|
2017-05-10 02:44:13 -07:00
|
|
|
func TestSampleDeliveryOrder(t *testing.T) {
|
|
|
|
ts := 10
|
2017-10-23 06:57:44 -07:00
|
|
|
n := config.DefaultQueueConfig.MaxSamplesPerSend * ts
|
2018-09-07 14:26:04 -07:00
|
|
|
samples := make([]tsdb.RefSample, 0, n)
|
|
|
|
series := make([]tsdb.RefSeries, 0, n)
|
2017-05-10 02:44:13 -07:00
|
|
|
for i := 0; i < n; i++ {
|
2018-09-07 14:26:04 -07:00
|
|
|
name := fmt.Sprintf("test_metric_%d", i%ts)
|
|
|
|
samples = append(samples, tsdb.RefSample{
|
|
|
|
Ref: uint64(i),
|
|
|
|
T: int64(i),
|
|
|
|
V: float64(i),
|
|
|
|
})
|
|
|
|
series = append(series, tsdb.RefSeries{
|
|
|
|
Ref: uint64(i),
|
|
|
|
Labels: labels.Labels{labels.Label{Name: "__name__", Value: name}},
|
2017-05-10 02:44:13 -07:00
|
|
|
})
|
|
|
|
}
|
|
|
|
|
|
|
|
c := NewTestStorageClient()
|
2018-09-07 14:26:04 -07:00
|
|
|
c.expectSamples(samples, series)
|
|
|
|
var temp int64
|
2019-02-13 17:11:17 -08:00
|
|
|
|
|
|
|
dir, err := ioutil.TempDir("", "TestSampleDeliveryOrder")
|
|
|
|
testutil.Ok(t, err)
|
|
|
|
defer os.RemoveAll(dir)
|
|
|
|
|
2019-02-15 01:54:01 -08:00
|
|
|
m := NewQueueManager(nil, dir, newEWMARate(ewmaWeight, shardUpdateDuration), &temp, config.DefaultQueueConfig, nil, nil, c, defaultFlushDeadline)
|
2018-09-07 14:26:04 -07:00
|
|
|
m.seriesLabels = refSeriesToLabelsProto(series)
|
2017-05-10 02:44:13 -07:00
|
|
|
|
|
|
|
m.Start()
|
|
|
|
defer m.Stop()
|
2018-09-07 14:26:04 -07:00
|
|
|
// These should be received by the client.
|
|
|
|
m.Append(samples)
|
2017-05-10 02:44:13 -07:00
|
|
|
c.waitForExpectedSamples(t)
|
|
|
|
}
|
|
|
|
|
2018-09-07 14:26:04 -07:00
|
|
|
func TestShutdown(t *testing.T) {
|
|
|
|
deadline := 5 * time.Second
|
|
|
|
c := NewTestBlockedStorageClient()
|
2017-05-10 02:44:13 -07:00
|
|
|
|
2018-09-07 14:26:04 -07:00
|
|
|
var temp int64
|
2019-02-13 17:11:17 -08:00
|
|
|
|
|
|
|
dir, err := ioutil.TempDir("", "TestShutdown")
|
|
|
|
testutil.Ok(t, err)
|
|
|
|
defer os.RemoveAll(dir)
|
|
|
|
|
2019-02-15 01:54:01 -08:00
|
|
|
m := NewQueueManager(nil, dir, newEWMARate(ewmaWeight, shardUpdateDuration), &temp, config.DefaultQueueConfig, nil, nil, c, deadline)
|
2018-09-07 14:26:04 -07:00
|
|
|
samples, series := createTimeseries(2 * config.DefaultQueueConfig.MaxSamplesPerSend)
|
|
|
|
m.seriesLabels = refSeriesToLabelsProto(series)
|
|
|
|
m.Start()
|
|
|
|
|
|
|
|
// Append blocks to guarantee delivery, so we do it in the background.
|
|
|
|
go func() {
|
|
|
|
m.Append(samples)
|
|
|
|
}()
|
|
|
|
time.Sleep(1 * time.Second)
|
|
|
|
|
|
|
|
// Test to ensure that Stop doesn't block.
|
|
|
|
start := time.Now()
|
|
|
|
m.Stop()
|
|
|
|
// The samples will never be delivered, so duration should
|
|
|
|
// be at least equal to deadline, otherwise the flush deadline
|
|
|
|
// was not respected.
|
|
|
|
duration := time.Since(start)
|
|
|
|
if duration > time.Duration(deadline+(deadline/10)) {
|
|
|
|
t.Errorf("Took too long to shutdown: %s > %s", duration, deadline)
|
|
|
|
}
|
|
|
|
if duration < time.Duration(deadline) {
|
|
|
|
t.Errorf("Shutdown occurred before flush deadline: %s < %s", duration, deadline)
|
2017-05-10 02:44:13 -07:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2018-09-07 14:26:04 -07:00
|
|
|
func TestSeriesReset(t *testing.T) {
|
|
|
|
c := NewTestBlockedStorageClient()
|
|
|
|
deadline := 5 * time.Second
|
|
|
|
var temp int64
|
|
|
|
numSegments := 4
|
|
|
|
numSeries := 25
|
|
|
|
|
2019-02-13 17:11:17 -08:00
|
|
|
dir, err := ioutil.TempDir("", "TestSeriesReset")
|
|
|
|
testutil.Ok(t, err)
|
|
|
|
defer os.RemoveAll(dir)
|
|
|
|
|
2019-02-15 01:54:01 -08:00
|
|
|
m := NewQueueManager(nil, dir, newEWMARate(ewmaWeight, shardUpdateDuration), &temp, config.DefaultQueueConfig, nil, nil, c, deadline)
|
2018-09-07 14:26:04 -07:00
|
|
|
for i := 0; i < numSegments; i++ {
|
|
|
|
series := []tsdb.RefSeries{}
|
|
|
|
for j := 0; j < numSeries; j++ {
|
|
|
|
series = append(series, tsdb.RefSeries{Ref: uint64((i * 100) + j), Labels: labels.Labels{labels.Label{Name: "a", Value: "a"}}})
|
|
|
|
}
|
|
|
|
m.StoreSeries(series, i)
|
2018-05-29 01:51:29 -07:00
|
|
|
}
|
2018-09-07 14:26:04 -07:00
|
|
|
testutil.Equals(t, numSegments*numSeries, len(m.seriesLabels))
|
|
|
|
m.SeriesReset(2)
|
|
|
|
testutil.Equals(t, numSegments*numSeries/2, len(m.seriesLabels))
|
2017-05-10 02:44:13 -07:00
|
|
|
}
|
|
|
|
|
2018-09-07 14:26:04 -07:00
|
|
|
func TestReshard(t *testing.T) {
|
|
|
|
size := 10 // Make bigger to find more races.
|
|
|
|
n := config.DefaultQueueConfig.Capacity * size
|
|
|
|
samples, series := createTimeseries(n)
|
|
|
|
|
|
|
|
c := NewTestStorageClient()
|
|
|
|
c.expectSamples(samples, series)
|
|
|
|
|
|
|
|
cfg := config.DefaultQueueConfig
|
|
|
|
cfg.MaxShards = 1
|
|
|
|
|
|
|
|
var temp int64
|
2019-02-13 17:11:17 -08:00
|
|
|
|
|
|
|
dir, err := ioutil.TempDir("", "TestReshard")
|
|
|
|
testutil.Ok(t, err)
|
|
|
|
defer os.RemoveAll(dir)
|
|
|
|
|
2019-02-15 01:54:01 -08:00
|
|
|
m := NewQueueManager(nil, dir, newEWMARate(ewmaWeight, shardUpdateDuration), &temp, cfg, nil, nil, c, defaultFlushDeadline)
|
2018-09-07 14:26:04 -07:00
|
|
|
m.seriesLabels = refSeriesToLabelsProto(series)
|
|
|
|
|
|
|
|
m.Start()
|
|
|
|
defer m.Stop()
|
|
|
|
|
|
|
|
go func() {
|
|
|
|
for i := 0; i < len(samples); i += config.DefaultQueueConfig.Capacity {
|
|
|
|
sent := m.Append(samples[i : i+config.DefaultQueueConfig.Capacity])
|
|
|
|
require.True(t, sent)
|
|
|
|
time.Sleep(100 * time.Millisecond)
|
|
|
|
}
|
|
|
|
}()
|
|
|
|
|
|
|
|
for i := 1; i < len(samples)/config.DefaultQueueConfig.Capacity; i++ {
|
|
|
|
m.shards.stop()
|
|
|
|
m.shards.start(i)
|
|
|
|
time.Sleep(100 * time.Millisecond)
|
|
|
|
}
|
|
|
|
|
|
|
|
c.waitForExpectedSamples(t)
|
2017-05-10 02:44:13 -07:00
|
|
|
}
|
|
|
|
|
2018-09-07 14:26:04 -07:00
|
|
|
func createTimeseries(n int) ([]tsdb.RefSample, []tsdb.RefSeries) {
|
|
|
|
samples := make([]tsdb.RefSample, 0, n)
|
|
|
|
series := make([]tsdb.RefSeries, 0, n)
|
|
|
|
for i := 0; i < n; i++ {
|
|
|
|
name := fmt.Sprintf("test_metric_%d", i)
|
|
|
|
samples = append(samples, tsdb.RefSample{
|
|
|
|
Ref: uint64(i),
|
|
|
|
T: int64(i),
|
|
|
|
V: float64(i),
|
|
|
|
})
|
|
|
|
series = append(series, tsdb.RefSeries{
|
|
|
|
Ref: uint64(i),
|
|
|
|
Labels: labels.Labels{labels.Label{Name: "__name__", Value: name}},
|
|
|
|
})
|
|
|
|
}
|
|
|
|
return samples, series
|
2017-05-10 02:44:13 -07:00
|
|
|
}
|
|
|
|
|
2018-09-07 14:26:04 -07:00
|
|
|
func getSeriesNameFromRef(r tsdb.RefSeries) string {
|
|
|
|
for _, l := range r.Labels {
|
|
|
|
if l.Name == "__name__" {
|
|
|
|
return l.Value
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return ""
|
2017-05-10 02:44:13 -07:00
|
|
|
}
|
|
|
|
|
2018-09-07 14:26:04 -07:00
|
|
|
func refSeriesToLabelsProto(series []tsdb.RefSeries) map[uint64][]prompb.Label {
|
|
|
|
result := make(map[uint64][]prompb.Label)
|
|
|
|
for _, s := range series {
|
|
|
|
for _, l := range s.Labels {
|
|
|
|
result[s.Ref] = append(result[s.Ref], prompb.Label{
|
|
|
|
Name: l.Name,
|
|
|
|
Value: l.Value,
|
|
|
|
})
|
|
|
|
}
|
2017-05-10 02:44:13 -07:00
|
|
|
}
|
2018-09-07 14:26:04 -07:00
|
|
|
return result
|
2017-05-10 02:44:13 -07:00
|
|
|
}
|
|
|
|
|
2018-09-07 14:26:04 -07:00
|
|
|
type TestStorageClient struct {
|
|
|
|
receivedSamples map[string][]prompb.Sample
|
|
|
|
expectedSamples map[string][]prompb.Sample
|
|
|
|
wg sync.WaitGroup
|
|
|
|
mtx sync.Mutex
|
|
|
|
}
|
2017-05-10 02:44:13 -07:00
|
|
|
|
2018-09-07 14:26:04 -07:00
|
|
|
func NewTestStorageClient() *TestStorageClient {
|
|
|
|
return &TestStorageClient{
|
|
|
|
receivedSamples: map[string][]prompb.Sample{},
|
|
|
|
expectedSamples: map[string][]prompb.Sample{},
|
2017-05-10 02:44:13 -07:00
|
|
|
}
|
2018-09-07 14:26:04 -07:00
|
|
|
}
|
2017-05-10 02:44:13 -07:00
|
|
|
|
2018-09-07 14:26:04 -07:00
|
|
|
func (c *TestStorageClient) expectSamples(ss []tsdb.RefSample, series []tsdb.RefSeries) {
|
|
|
|
c.mtx.Lock()
|
|
|
|
defer c.mtx.Unlock()
|
2017-05-10 02:44:13 -07:00
|
|
|
|
2018-09-07 14:26:04 -07:00
|
|
|
c.expectedSamples = map[string][]prompb.Sample{}
|
|
|
|
c.receivedSamples = map[string][]prompb.Sample{}
|
2017-05-10 02:44:13 -07:00
|
|
|
|
2018-09-07 14:26:04 -07:00
|
|
|
for _, s := range ss {
|
|
|
|
seriesName := getSeriesNameFromRef(series[s.Ref])
|
|
|
|
c.expectedSamples[seriesName] = append(c.expectedSamples[seriesName], prompb.Sample{
|
|
|
|
Timestamp: s.T,
|
|
|
|
Value: s.V,
|
|
|
|
})
|
|
|
|
}
|
|
|
|
c.wg.Add(len(ss))
|
|
|
|
}
|
2017-05-10 02:44:13 -07:00
|
|
|
|
2018-09-07 14:26:04 -07:00
|
|
|
func (c *TestStorageClient) waitForExpectedSamples(t *testing.T) {
|
|
|
|
c.wg.Wait()
|
|
|
|
c.mtx.Lock()
|
|
|
|
defer c.mtx.Unlock()
|
|
|
|
for ts, expectedSamples := range c.expectedSamples {
|
|
|
|
if !reflect.DeepEqual(expectedSamples, c.receivedSamples[ts]) {
|
|
|
|
t.Fatalf("%s: Expected %v, got %v", ts, expectedSamples, c.receivedSamples[ts])
|
|
|
|
}
|
2017-05-10 02:44:13 -07:00
|
|
|
}
|
2018-09-07 14:26:04 -07:00
|
|
|
}
|
2017-05-10 02:44:13 -07:00
|
|
|
|
2018-09-07 14:26:04 -07:00
|
|
|
func (c *TestStorageClient) Store(_ context.Context, req []byte) error {
|
|
|
|
c.mtx.Lock()
|
|
|
|
defer c.mtx.Unlock()
|
|
|
|
reqBuf, err := snappy.Decode(nil, req)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
2017-05-10 02:44:13 -07:00
|
|
|
}
|
|
|
|
|
2018-09-07 14:26:04 -07:00
|
|
|
var reqProto prompb.WriteRequest
|
|
|
|
if err := proto.Unmarshal(reqBuf, &reqProto); err != nil {
|
|
|
|
return err
|
2017-05-10 02:44:13 -07:00
|
|
|
}
|
|
|
|
|
2018-09-07 14:26:04 -07:00
|
|
|
count := 0
|
|
|
|
for _, ts := range reqProto.Timeseries {
|
|
|
|
var seriesName string
|
|
|
|
labels := labelProtosToLabels(ts.Labels)
|
|
|
|
for _, label := range labels {
|
|
|
|
if label.Name == "__name__" {
|
|
|
|
seriesName = label.Value
|
|
|
|
}
|
|
|
|
}
|
|
|
|
for _, sample := range ts.Samples {
|
|
|
|
count++
|
|
|
|
c.receivedSamples[seriesName] = append(c.receivedSamples[seriesName], sample)
|
|
|
|
}
|
2017-05-10 02:44:13 -07:00
|
|
|
}
|
2018-09-07 14:26:04 -07:00
|
|
|
c.wg.Add(-count)
|
|
|
|
return nil
|
2017-05-10 02:44:13 -07:00
|
|
|
}
|
2018-05-29 01:51:29 -07:00
|
|
|
|
2018-09-07 14:26:04 -07:00
|
|
|
func (c *TestStorageClient) Name() string {
|
|
|
|
return "teststorageclient"
|
|
|
|
}
|
2018-05-29 01:51:29 -07:00
|
|
|
|
2018-09-07 14:26:04 -07:00
|
|
|
// TestBlockingStorageClient is a queue_manager StorageClient whose Store()
// calls block until the request's Context is cancelled. Every call is counted
// in numCalls, which can be read through NumCalls().
type TestBlockingStorageClient struct {
	numCalls uint64 // Read and written only through sync/atomic.
}

// NewTestBlockedStorageClient returns a blocking client with a zero call
// count.
func NewTestBlockedStorageClient() *TestBlockingStorageClient {
	return new(TestBlockingStorageClient)
}

// Store counts the call, waits until ctx is done and then returns nil. The
// request payload is ignored.
func (c *TestBlockingStorageClient) Store(ctx context.Context, _ []byte) error {
	atomic.AddUint64(&c.numCalls, 1)
	done := ctx.Done()
	<-done
	return nil
}

// NumCalls returns how many times Store has been called so far.
func (c *TestBlockingStorageClient) NumCalls() uint64 {
	calls := atomic.LoadUint64(&c.numCalls)
	return calls
}

// Name returns the fixed identifier of this test client.
func (c *TestBlockingStorageClient) Name() string {
	const name = "testblockingstorageclient"
	return name
}
|