mirror of
https://github.com/prometheus/prometheus.git
synced 2025-01-11 05:47:27 -08:00
Reduce chunk write queue memory usage (#10873)
* dont waste space on the chunkRefMap * add time factor * add comments * better readability * add instrumentation and more comments * formatting * uppercase comments * Address review feedback. Renamed "free" to "shrink" everywhere, updated comments and threshold to 1000. * double space Signed-off-by: Mauro Stettler <mauro.stettler@gmail.com> Co-authored-by: Peter Štibraný <pstibrany@gmail.com> Co-authored-by: Mauro Stettler <mauro.stettler@gmail.com>
This commit is contained in:
parent
9f77d23889
commit
03a2313f7a
|
@ -16,12 +16,21 @@ package chunks
|
||||||
import (
|
import (
|
||||||
"errors"
|
"errors"
|
||||||
"sync"
|
"sync"
|
||||||
|
"time"
|
||||||
|
|
||||||
"github.com/prometheus/client_golang/prometheus"
|
"github.com/prometheus/client_golang/prometheus"
|
||||||
|
|
||||||
"github.com/prometheus/prometheus/tsdb/chunkenc"
|
"github.com/prometheus/prometheus/tsdb/chunkenc"
|
||||||
)
|
)
|
||||||
|
|
||||||
|
const (
|
||||||
|
// Minimum recorded peak since since the last shrinking of chunkWriteQueue.chunkrefMap to shrink it again.
|
||||||
|
chunkRefMapShrinkThreshold = 1000
|
||||||
|
|
||||||
|
// Minimum interval between shrinking of chunkWriteQueue.chunkRefMap.
|
||||||
|
chunkRefMapMinShrinkInterval = 10 * time.Minute
|
||||||
|
)
|
||||||
|
|
||||||
type chunkWriteJob struct {
|
type chunkWriteJob struct {
|
||||||
cutFile bool
|
cutFile bool
|
||||||
seriesRef HeadSeriesRef
|
seriesRef HeadSeriesRef
|
||||||
|
@ -38,21 +47,28 @@ type chunkWriteJob struct {
|
||||||
type chunkWriteQueue struct {
|
type chunkWriteQueue struct {
|
||||||
jobs chan chunkWriteJob
|
jobs chan chunkWriteJob
|
||||||
|
|
||||||
chunkRefMapMtx sync.RWMutex
|
chunkRefMapMtx sync.RWMutex
|
||||||
chunkRefMap map[ChunkDiskMapperRef]chunkenc.Chunk
|
chunkRefMap map[ChunkDiskMapperRef]chunkenc.Chunk
|
||||||
|
chunkRefMapPeakSize int // Largest size that chunkRefMap has grown to since the last time we shrank it.
|
||||||
|
chunkRefMapLastShrink time.Time // When the chunkRefMap has been shrunk the last time.
|
||||||
|
|
||||||
isRunningMtx sync.Mutex // Protects the isRunning property.
|
// isRunningMtx serves two purposes:
|
||||||
isRunning bool // Used to prevent that new jobs get added to the queue when the chan is already closed.
|
// 1. It protects isRunning field.
|
||||||
|
// 2. It serializes adding of jobs to the chunkRefMap in addJob() method. If jobs channel is full then addJob() will block
|
||||||
|
// while holding this mutex, which guarantees that chunkRefMap won't ever grow beyond the queue size + 1.
|
||||||
|
isRunningMtx sync.Mutex
|
||||||
|
isRunning bool // Used to prevent that new jobs get added to the queue when the chan is already closed.
|
||||||
|
|
||||||
workerWg sync.WaitGroup
|
workerWg sync.WaitGroup
|
||||||
|
|
||||||
writeChunk writeChunkF
|
writeChunk writeChunkF
|
||||||
|
|
||||||
// Keeping three separate counters instead of only a single CounterVec to improve the performance of the critical
|
// Keeping separate counters instead of only a single CounterVec to improve the performance of the critical
|
||||||
// addJob() method which otherwise would need to perform a WithLabelValues call on the CounterVec.
|
// addJob() method which otherwise would need to perform a WithLabelValues call on the CounterVec.
|
||||||
adds prometheus.Counter
|
adds prometheus.Counter
|
||||||
gets prometheus.Counter
|
gets prometheus.Counter
|
||||||
completed prometheus.Counter
|
completed prometheus.Counter
|
||||||
|
shrink prometheus.Counter
|
||||||
}
|
}
|
||||||
|
|
||||||
// writeChunkF is a function which writes chunks, it is dynamic to allow mocking in tests.
|
// writeChunkF is a function which writes chunks, it is dynamic to allow mocking in tests.
|
||||||
|
@ -68,13 +84,15 @@ func newChunkWriteQueue(reg prometheus.Registerer, size int, writeChunk writeChu
|
||||||
)
|
)
|
||||||
|
|
||||||
q := &chunkWriteQueue{
|
q := &chunkWriteQueue{
|
||||||
jobs: make(chan chunkWriteJob, size),
|
jobs: make(chan chunkWriteJob, size),
|
||||||
chunkRefMap: make(map[ChunkDiskMapperRef]chunkenc.Chunk, size),
|
chunkRefMap: make(map[ChunkDiskMapperRef]chunkenc.Chunk),
|
||||||
writeChunk: writeChunk,
|
chunkRefMapLastShrink: time.Now(),
|
||||||
|
writeChunk: writeChunk,
|
||||||
|
|
||||||
adds: counters.WithLabelValues("add"),
|
adds: counters.WithLabelValues("add"),
|
||||||
gets: counters.WithLabelValues("get"),
|
gets: counters.WithLabelValues("get"),
|
||||||
completed: counters.WithLabelValues("complete"),
|
completed: counters.WithLabelValues("complete"),
|
||||||
|
shrink: counters.WithLabelValues("shrink"),
|
||||||
}
|
}
|
||||||
|
|
||||||
if reg != nil {
|
if reg != nil {
|
||||||
|
@ -112,6 +130,42 @@ func (c *chunkWriteQueue) processJob(job chunkWriteJob) {
|
||||||
delete(c.chunkRefMap, job.ref)
|
delete(c.chunkRefMap, job.ref)
|
||||||
|
|
||||||
c.completed.Inc()
|
c.completed.Inc()
|
||||||
|
|
||||||
|
c.shrinkChunkRefMap()
|
||||||
|
}
|
||||||
|
|
||||||
|
// shrinkChunkRefMap checks whether the conditions to shrink the chunkRefMap are met,
|
||||||
|
// if so chunkRefMap is reinitialized. The chunkRefMapMtx must be held when calling this method.
|
||||||
|
//
|
||||||
|
// We do this because Go runtime doesn't release internal memory used by map after map has been emptied.
|
||||||
|
// To achieve that we create new map instead and throw the old one away.
|
||||||
|
func (c *chunkWriteQueue) shrinkChunkRefMap() {
|
||||||
|
if len(c.chunkRefMap) > 0 {
|
||||||
|
// Can't shrink it while there is data in it.
|
||||||
|
return
|
||||||
|
}
|
||||||
|
|
||||||
|
if c.chunkRefMapPeakSize < chunkRefMapShrinkThreshold {
|
||||||
|
// Not shrinking it because it has not grown to the minimum threshold yet.
|
||||||
|
return
|
||||||
|
}
|
||||||
|
|
||||||
|
now := time.Now()
|
||||||
|
|
||||||
|
if now.Sub(c.chunkRefMapLastShrink) < chunkRefMapMinShrinkInterval {
|
||||||
|
// Not shrinking it because the minimum duration between shrink-events has not passed yet.
|
||||||
|
return
|
||||||
|
}
|
||||||
|
|
||||||
|
// Re-initialize the chunk ref map to half of the peak size that it has grown to since the last re-init event.
|
||||||
|
// We are trying to hit the sweet spot in the trade-off between initializing it to a very small size
|
||||||
|
// potentially resulting in many allocations to re-grow it, and initializing it to a large size potentially
|
||||||
|
// resulting in unused allocated memory.
|
||||||
|
c.chunkRefMap = make(map[ChunkDiskMapperRef]chunkenc.Chunk, c.chunkRefMapPeakSize/2)
|
||||||
|
|
||||||
|
c.chunkRefMapPeakSize = 0
|
||||||
|
c.chunkRefMapLastShrink = now
|
||||||
|
c.shrink.Inc()
|
||||||
}
|
}
|
||||||
|
|
||||||
func (c *chunkWriteQueue) addJob(job chunkWriteJob) (err error) {
|
func (c *chunkWriteQueue) addJob(job chunkWriteJob) (err error) {
|
||||||
|
@ -125,11 +179,16 @@ func (c *chunkWriteQueue) addJob(job chunkWriteJob) (err error) {
|
||||||
defer c.isRunningMtx.Unlock()
|
defer c.isRunningMtx.Unlock()
|
||||||
|
|
||||||
if !c.isRunning {
|
if !c.isRunning {
|
||||||
return errors.New("queue is not started")
|
return errors.New("queue is not running")
|
||||||
}
|
}
|
||||||
|
|
||||||
c.chunkRefMapMtx.Lock()
|
c.chunkRefMapMtx.Lock()
|
||||||
c.chunkRefMap[job.ref] = job.chk
|
c.chunkRefMap[job.ref] = job.chk
|
||||||
|
|
||||||
|
// Keep track of the peak usage of c.chunkRefMap.
|
||||||
|
if len(c.chunkRefMap) > c.chunkRefMapPeakSize {
|
||||||
|
c.chunkRefMapPeakSize = len(c.chunkRefMap)
|
||||||
|
}
|
||||||
c.chunkRefMapMtx.Unlock()
|
c.chunkRefMapMtx.Unlock()
|
||||||
|
|
||||||
c.jobs <- job
|
c.jobs <- job
|
||||||
|
|
Loading…
Reference in a new issue