mirror of
https://github.com/prometheus/prometheus.git
synced 2024-12-24 21:24:05 -08:00
fada85a83c
This is based on my experience while debugging https://github.com/prometheus/prometheus/issues/3943. I needed to deduce a few things, and all of that would have been a bit easier with these two logs: - the new block's ULID on each compaction. - the actual list of blocks (ULID + time range) on Prometheus startup (easy to log while repairing blocks). We don't really need to log the blocks that take part in a compaction - that can be deduced easily from the time ranges of the blocks we currently have in the system. What do you think? Signed-off-by: Bartek Plotka <bwplotka@gmail.com>
105 lines
2.4 KiB
Go
105 lines
2.4 KiB
Go
package tsdb
|
|
|
|
import (
|
|
"encoding/json"
|
|
"io"
|
|
"io/ioutil"
|
|
"os"
|
|
"path"
|
|
"path/filepath"
|
|
|
|
"github.com/go-kit/kit/log"
|
|
"github.com/go-kit/kit/log/level"
|
|
"github.com/oklog/ulid"
|
|
"github.com/pkg/errors"
|
|
"github.com/prometheus/tsdb/fileutil"
|
|
)
|
|
|
|
// repairBadIndexVersion repairs an issue in index and meta.json persistence introduced in
|
|
// commit 129773b41a565fde5156301e37f9a87158030443.
|
|
func repairBadIndexVersion(logger log.Logger, dir string) error {
|
|
// All blocks written by Prometheus 2.1 with a meta.json version of 2 are affected.
|
|
// We must actually set the index file version to 2 and revert the meta.json version back to 1.
|
|
subdirs, err := fileutil.ReadDir(dir)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
for _, d := range subdirs {
|
|
// Skip non-block dirs.
|
|
if _, err := ulid.Parse(d); err != nil {
|
|
continue
|
|
}
|
|
d = path.Join(dir, d)
|
|
|
|
meta, err := readBogusMetaFile(d)
|
|
if err != nil {
|
|
return err
|
|
}
|
|
if meta.Version == 1 {
|
|
level.Info(logger).Log(
|
|
"msg", "found healthy block",
|
|
"mint", meta.MinTime,
|
|
"maxt", meta.MaxTime,
|
|
"ulid", meta.ULID,
|
|
)
|
|
continue
|
|
}
|
|
level.Info(logger).Log(
|
|
"msg", "fixing broken block",
|
|
"mint", meta.MinTime,
|
|
"maxt", meta.MaxTime,
|
|
"ulid", meta.ULID,
|
|
)
|
|
|
|
repl, err := os.Create(filepath.Join(d, "index.repaired"))
|
|
if err != nil {
|
|
return err
|
|
}
|
|
broken, err := os.Open(filepath.Join(d, "index"))
|
|
if err != nil {
|
|
return err
|
|
}
|
|
if _, err := io.Copy(repl, broken); err != nil {
|
|
return err
|
|
}
|
|
// Set the 5th byte to 2 to indiciate the correct file format version.
|
|
if _, err := repl.WriteAt([]byte{2}, 4); err != nil {
|
|
return err
|
|
}
|
|
if err := fileutil.Fsync(repl); err != nil {
|
|
return err
|
|
}
|
|
if err := repl.Close(); err != nil {
|
|
return err
|
|
}
|
|
if err := broken.Close(); err != nil {
|
|
return err
|
|
}
|
|
if err := renameFile(repl.Name(), broken.Name()); err != nil {
|
|
return err
|
|
}
|
|
// Reset version of meta.json to 1.
|
|
meta.Version = 1
|
|
if err := writeMetaFile(d, meta); err != nil {
|
|
return err
|
|
}
|
|
}
|
|
return nil
|
|
}
|
|
|
|
func readBogusMetaFile(dir string) (*BlockMeta, error) {
|
|
b, err := ioutil.ReadFile(filepath.Join(dir, metaFilename))
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
var m BlockMeta
|
|
|
|
if err := json.Unmarshal(b, &m); err != nil {
|
|
return nil, err
|
|
}
|
|
if m.Version != 1 && m.Version != 2 {
|
|
return nil, errors.Errorf("unexpected meta file version %d", m.Version)
|
|
}
|
|
return &m, nil
|
|
}
|