prometheus/compact.go

425 lines
8.5 KiB
Go
Raw Normal View History

package tsdb
import (
"os"
2017-01-02 05:41:13 -08:00
"path/filepath"
2017-01-03 06:43:26 -08:00
"time"
2017-01-02 05:41:13 -08:00
"github.com/coreos/etcd/pkg/fileutil"
"github.com/fabxc/tsdb/labels"
2017-01-03 06:43:26 -08:00
"github.com/pkg/errors"
"github.com/prometheus/client_golang/prometheus"
)
type compactor struct {
2017-01-03 06:43:26 -08:00
metrics *compactorMetrics
blocks compactableBlocks
}
2017-01-03 06:43:26 -08:00
type compactorMetrics struct {
ran prometheus.Counter
failed prometheus.Counter
duration prometheus.Histogram
2017-01-03 06:43:26 -08:00
}
func newCompactorMetrics(r prometheus.Registerer) *compactorMetrics {
2017-01-03 06:43:26 -08:00
m := &compactorMetrics{}
m.ran = prometheus.NewCounter(prometheus.CounterOpts{
Name: "tsdb_compactions_total",
Help: "Total number of compactions that were executed for the partition.",
2017-01-03 06:43:26 -08:00
})
m.failed = prometheus.NewCounter(prometheus.CounterOpts{
Name: "tsdb_compactions_failed_total",
Help: "Total number of compactions that failed for the partition.",
2017-01-03 06:43:26 -08:00
})
m.duration = prometheus.NewHistogram(prometheus.HistogramOpts{
Name: "tsdb_compaction_duration",
Help: "Duration of compaction runs.",
2017-01-03 06:43:26 -08:00
})
if r != nil {
r.MustRegister(
m.ran,
m.failed,
m.duration,
)
}
2017-01-03 06:43:26 -08:00
return m
}
type blockStore interface {
blocks() []Block
}
2017-01-03 01:09:20 -08:00
type compactableBlocks interface {
compactable() []Block
2017-01-03 01:09:20 -08:00
}
2017-01-09 10:14:21 -08:00
func newCompactor(blocks compactableBlocks, r prometheus.Registerer) (*compactor, error) {
c := &compactor{
blocks: blocks,
2017-01-09 10:14:21 -08:00
metrics: newCompactorMetrics(r),
}
return c, nil
}
const (
compactionMaxSize = 1 << 30 // 1GB
compactionBlocks = 2
)
func (c *compactor) pick() []Block {
2017-01-03 06:43:26 -08:00
bs := c.blocks.compactable()
if len(bs) == 0 {
return nil
}
if len(bs) == 1 && !bs[0].Persisted() {
return bs
2017-01-03 06:43:26 -08:00
}
if !bs[0].Persisted() {
if len(bs) == 2 || !compactionMatch(bs[:3]) {
return bs[:1]
}
}
2017-01-03 06:43:26 -08:00
for i := 0; i+2 < len(bs); i += 3 {
tpl := bs[i : i+3]
if compactionMatch(tpl) {
return tpl
2017-01-03 06:43:26 -08:00
}
}
return nil
}
func compactionMatch(blocks []Block) bool {
// TODO(fabxc): check whether combined size is below maxCompactionSize.
// Apply maximum time range? or number of series? might already be covered by size implicitly.
2017-01-03 06:43:26 -08:00
// Naively check whether both blocks have roughly the same number of samples
// and whether the total sample count doesn't exceed 2GB chunk file size
// by rough approximation.
n := float64(blocks[0].Stats().SampleCount)
t := n
for _, b := range blocks[1:] {
m := float64(b.Stats().SampleCount)
if m < 0.8*n || m > 1.2*n {
return false
}
t += m
}
// Pessimistic 10 bytes/sample should do.
return t < 10*200e6
2017-01-03 01:09:20 -08:00
}
func mergeStats(blocks ...Block) (res BlockStats) {
res.MinTime = blocks[0].Stats().MinTime
res.MaxTime = blocks[len(blocks)-1].Stats().MaxTime
2017-01-03 06:43:26 -08:00
for _, b := range blocks {
res.SampleCount += b.Stats().SampleCount
}
2017-01-03 06:43:26 -08:00
return res
}
func (c *compactor) compact(dir string, blocks ...Block) (err error) {
start := time.Now()
defer func() {
if err != nil {
c.metrics.failed.Inc()
}
c.metrics.duration.Observe(time.Since(start).Seconds())
}()
2017-01-03 06:43:26 -08:00
// Write to temporary directory to make persistence appear atomic.
if fileutil.Exist(dir) {
if err = os.RemoveAll(dir); err != nil {
2017-01-03 06:43:26 -08:00
return err
}
}
if err = fileutil.CreateDirAll(dir); err != nil {
return err
}
chunkf, err := fileutil.LockFile(chunksFileName(dir), os.O_WRONLY|os.O_CREATE, 0666)
if err != nil {
2017-01-03 06:43:26 -08:00
return errors.Wrap(err, "create chunk file")
}
indexf, err := fileutil.LockFile(indexFileName(dir), os.O_WRONLY|os.O_CREATE, 0666)
if err != nil {
2017-01-03 06:43:26 -08:00
return errors.Wrap(err, "create index file")
}
indexw := newIndexWriter(indexf)
chunkw := newSeriesWriter(chunkf, indexw)
if err = c.write(blocks, indexw, chunkw); err != nil {
2017-01-03 06:43:26 -08:00
return errors.Wrap(err, "write compaction")
}
if err = chunkw.Close(); err != nil {
2017-01-03 06:43:26 -08:00
return errors.Wrap(err, "close chunk writer")
}
if err = indexw.Close(); err != nil {
2017-01-03 06:43:26 -08:00
return errors.Wrap(err, "close index writer")
}
if err = fileutil.Fsync(chunkf.File); err != nil {
2017-01-03 06:43:26 -08:00
return errors.Wrap(err, "fsync chunk file")
}
if err = fileutil.Fsync(indexf.File); err != nil {
2017-01-03 06:43:26 -08:00
return errors.Wrap(err, "fsync index file")
}
if err = chunkf.Close(); err != nil {
2017-01-03 06:43:26 -08:00
return errors.Wrap(err, "close chunk file")
}
if err = indexf.Close(); err != nil {
2017-01-03 06:43:26 -08:00
return errors.Wrap(err, "close index file")
}
return nil
2017-01-03 06:43:26 -08:00
}
func (c *compactor) write(blocks []Block, indexw IndexWriter, chunkw SeriesWriter) error {
2017-01-03 06:43:26 -08:00
var set compactionSet
for i, b := range blocks {
all, err := b.Index().Postings("", "")
2017-01-03 06:43:26 -08:00
if err != nil {
return err
}
// TODO(fabxc): find more transparent way of handling this.
if hb, ok := b.(*headBlock); ok {
all = hb.remapPostings(all)
}
s := newCompactionSeriesSet(b.Index(), b.Series(), all)
2017-01-03 06:43:26 -08:00
if i == 0 {
set = s
continue
}
set, err = newCompactionMerger(set, s)
if err != nil {
return err
}
}
// We fully rebuild the postings list index from merged series.
var (
postings = &memPostings{m: make(map[term][]uint32, 512)}
values = map[string]stringset{}
i = uint32(0)
2017-01-03 06:43:26 -08:00
stats = mergeStats(blocks...)
)
for set.Next() {
lset, chunks := set.At()
2017-01-02 07:58:47 -08:00
if err := chunkw.WriteSeries(i, lset, chunks); err != nil {
return err
}
2017-01-07 09:02:17 -08:00
stats.ChunkCount += uint64(len(chunks))
stats.SeriesCount++
for _, l := range lset {
valset, ok := values[l.Name]
if !ok {
valset = stringset{}
values[l.Name] = valset
}
valset.set(l.Value)
postings.add(i, term{name: l.Name, value: l.Value})
}
i++
}
if set.Err() != nil {
return set.Err()
}
2017-01-02 07:58:47 -08:00
if err := indexw.WriteStats(stats); err != nil {
return err
}
s := make([]string, 0, 256)
for n, v := range values {
s = s[:0]
for x := range v {
s = append(s, x)
}
2017-01-02 07:58:47 -08:00
if err := indexw.WriteLabelIndex([]string{n}, s); err != nil {
return err
}
}
for t := range postings.m {
2017-01-02 07:58:47 -08:00
if err := indexw.WritePostings(t.name, t.value, postings.get(t)); err != nil {
return err
}
}
// Write a postings list containing all series.
all := make([]uint32, i)
for i := range all {
all[i] = uint32(i)
}
2017-01-02 07:58:47 -08:00
if err := indexw.WritePostings("", "", newListPostings(all)); err != nil {
return err
}
return nil
}
2017-01-03 06:43:26 -08:00
type compactionSet interface {
Next() bool
At() (labels.Labels, []ChunkMeta)
Err() error
}
type compactionSeriesSet struct {
p Postings
index IndexReader
series SeriesReader
l labels.Labels
c []ChunkMeta
err error
}
func newCompactionSeriesSet(i IndexReader, s SeriesReader, p Postings) *compactionSeriesSet {
return &compactionSeriesSet{
index: i,
series: s,
p: p,
}
}
func (c *compactionSeriesSet) Next() bool {
if !c.p.Next() {
return false
}
2017-01-02 04:27:52 -08:00
c.l, c.c, c.err = c.index.Series(c.p.At())
if c.err != nil {
return false
}
for i := range c.c {
chk := &c.c[i]
chk.Chunk, c.err = c.series.Chunk(chk.Ref)
if c.err != nil {
return false
}
}
return true
}
func (c *compactionSeriesSet) Err() error {
if c.err != nil {
return c.err
}
return c.p.Err()
}
func (c *compactionSeriesSet) At() (labels.Labels, []ChunkMeta) {
return c.l, c.c
}
type compactionMerger struct {
2017-01-03 06:43:26 -08:00
a, b compactionSet
aok, bok bool
l labels.Labels
c []ChunkMeta
}
type compactionSeries struct {
labels labels.Labels
chunks []ChunkMeta
}
2017-01-03 06:43:26 -08:00
func newCompactionMerger(a, b compactionSet) (*compactionMerger, error) {
c := &compactionMerger{
a: a,
b: b,
}
// Initialize first elements of both sets as Next() needs
// one element look-ahead.
c.aok = c.a.Next()
c.bok = c.b.Next()
return c, c.Err()
}
func (c *compactionMerger) compare() int {
if !c.aok {
return 1
}
if !c.bok {
return -1
}
a, _ := c.a.At()
b, _ := c.b.At()
return labels.Compare(a, b)
}
func (c *compactionMerger) Next() bool {
if !c.aok && !c.bok || c.Err() != nil {
return false
}
d := c.compare()
// Both sets contain the current series. Chain them into a single one.
if d > 0 {
c.l, c.c = c.b.At()
c.bok = c.b.Next()
} else if d < 0 {
c.l, c.c = c.a.At()
c.aok = c.a.Next()
} else {
l, ca := c.a.At()
_, cb := c.b.At()
c.l = l
c.c = append(ca, cb...)
c.aok = c.a.Next()
c.bok = c.b.Next()
}
return true
}
func (c *compactionMerger) Err() error {
if c.a.Err() != nil {
return c.a.Err()
}
return c.b.Err()
}
func (c *compactionMerger) At() (labels.Labels, []ChunkMeta) {
return c.l, c.c
}
2017-01-02 05:41:13 -08:00
func renameDir(from, to string) error {
if err := os.RemoveAll(to); err != nil {
return err
}
if err := os.Rename(from, to); err != nil {
return err
}
// Directory was renamed; sync parent dir to persist rename.
pdir, err := fileutil.OpenDir(filepath.Dir(to))
if err != nil {
return err
}
if err = fileutil.Fsync(pdir); err != nil {
return err
}
if err = pdir.Close(); err != nil {
return err
}
return nil
}