Remote Write: Add max samples per metadata send (#8959)

* Added MaxSamplesPerSend

Signed-off-by: Levi Harrison <git@leviharrison.dev>

* Added tests

Signed-off-by: Levi Harrison <git@leviharrison.dev>

* Fixed order of require

Signed-off-by: Levi Harrison <git@leviharrison.dev>

* Added docs

Signed-off-by: Levi Harrison <git@leviharrison.dev>

* writes -> writesReceived

Signed-off-by: Levi Harrison <git@leviharrison.dev>

* Improved send loop

Signed-off-by: Levi Harrison <git@leviharrison.dev>
This commit is contained in:
Levi Harrison 2021-06-24 18:39:50 -04:00 committed by GitHub
parent 7cb55d5732
commit d5c3c567d3
No known key found for this signature in database
GPG key ID: 4AEE18F83AFDEB23
4 changed files with 36 additions and 13 deletions

View file

@ -173,8 +173,9 @@ var (
// DefaultMetadataConfig is the default metadata configuration for a remote write endpoint. // DefaultMetadataConfig is the default metadata configuration for a remote write endpoint.
DefaultMetadataConfig = MetadataConfig{ DefaultMetadataConfig = MetadataConfig{
Send: true, Send: true,
SendInterval: model.Duration(1 * time.Minute), SendInterval: model.Duration(1 * time.Minute),
MaxSamplesPerSend: 500,
} }
// DefaultRemoteReadConfig is the default remote read configuration. // DefaultRemoteReadConfig is the default remote read configuration.
@ -731,6 +732,8 @@ type MetadataConfig struct {
Send bool `yaml:"send"` Send bool `yaml:"send"`
// SendInterval controls how frequently we send metric metadata. // SendInterval controls how frequently we send metric metadata.
SendInterval model.Duration `yaml:"send_interval"` SendInterval model.Duration `yaml:"send_interval"`
// Maximum number of samples per send.
MaxSamplesPerSend int `yaml:"max_samples_per_send,omitempty"`
} }
// SigV4Config is the configuration for signing remote write requests with // SigV4Config is the configuration for signing remote write requests with

View file

@ -2443,6 +2443,8 @@ metadata_config:
[ send: <boolean> | default = true ] [ send: <boolean> | default = true ]
# How frequently metric metadata is sent to remote storage. # How frequently metric metadata is sent to remote storage.
[ send_interval: <duration> | default = 1m ] [ send_interval: <duration> | default = 1m ]
# Maximum number of samples per send.
[ max_samples_per_send: <int> | default = 500]
``` ```
There is a list of There is a list of

View file

@ -443,11 +443,17 @@ func (t *QueueManager) AppendMetadata(ctx context.Context, metadata []scrape.Met
}) })
} }
err := t.sendMetadataWithBackoff(ctx, mm) numSends := int(math.Ceil(float64(len(metadata)) / float64(t.mcfg.MaxSamplesPerSend)))
for i := 0; i < numSends; i++ {
if err != nil { last := (i + 1) * t.mcfg.MaxSamplesPerSend
t.metrics.failedMetadataTotal.Add(float64(len(metadata))) if last > len(metadata) {
level.Error(t.logger).Log("msg", "non-recoverable error while sending metadata", "count", len(metadata), "err", err) last = len(metadata)
}
err := t.sendMetadataWithBackoff(ctx, mm[i*t.mcfg.MaxSamplesPerSend:last])
if err != nil {
t.metrics.failedMetadataTotal.Add(float64(last - (i * t.mcfg.MaxSamplesPerSend)))
level.Error(t.logger).Log("msg", "non-recoverable error while sending metadata", "count", last-(i*t.mcfg.MaxSamplesPerSend), "err", err)
}
} }
} }

View file

@ -167,16 +167,25 @@ func TestMetadataDelivery(t *testing.T) {
m.Start() m.Start()
defer m.Stop() defer m.Stop()
m.AppendMetadata(context.Background(), []scrape.MetricMetadata{ metadata := []scrape.MetricMetadata{}
{ numMetadata := 1532
Metric: "prometheus_remote_storage_sent_metadata_bytes_total", for i := 0; i < numMetadata; i++ {
metadata = append(metadata, scrape.MetricMetadata{
Metric: "prometheus_remote_storage_sent_metadata_bytes_total_" + strconv.Itoa(i),
Type: textparse.MetricTypeCounter, Type: textparse.MetricTypeCounter,
Help: "a nice help text", Help: "a nice help text",
Unit: "", Unit: "",
}, })
}) }
require.Equal(t, len(c.receivedMetadata), 1) m.AppendMetadata(context.Background(), metadata)
require.Equal(t, numMetadata, len(c.receivedMetadata))
// One more write than the rounded qoutient should be performed in order to get samples that didn't
// fit into MaxSamplesPerSend.
require.Equal(t, numMetadata/mcfg.MaxSamplesPerSend+1, c.writesReceived)
// Make sure the last samples were sent.
require.Equal(t, c.receivedMetadata[metadata[len(metadata)-1].Metric][0].MetricFamilyName, metadata[len(metadata)-1].Metric)
} }
func TestSampleDeliveryTimeout(t *testing.T) { func TestSampleDeliveryTimeout(t *testing.T) {
@ -522,6 +531,7 @@ type TestWriteClient struct {
receivedExemplars map[string][]prompb.Exemplar receivedExemplars map[string][]prompb.Exemplar
expectedExemplars map[string][]prompb.Exemplar expectedExemplars map[string][]prompb.Exemplar
receivedMetadata map[string][]prompb.MetricMetadata receivedMetadata map[string][]prompb.MetricMetadata
writesReceived int
withWaitGroup bool withWaitGroup bool
wg sync.WaitGroup wg sync.WaitGroup
mtx sync.Mutex mtx sync.Mutex
@ -655,6 +665,8 @@ func (c *TestWriteClient) Store(_ context.Context, req []byte) error {
c.receivedMetadata[m.MetricFamilyName] = append(c.receivedMetadata[m.MetricFamilyName], m) c.receivedMetadata[m.MetricFamilyName] = append(c.receivedMetadata[m.MetricFamilyName], m)
} }
c.writesReceived++
return nil return nil
} }