prometheus/tsdb/repair.go

131 lines
4.1 KiB
Go
Raw Permalink Normal View History

// Copyright 2018 The Prometheus Authors
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
2018-02-09 04:11:03 -08:00
package tsdb
import (
"encoding/json"
"io"
"os"
"path/filepath"
"github.com/go-kit/log"
"github.com/go-kit/log/level"
2018-02-09 04:11:03 -08:00
"github.com/pkg/errors"
tsdb_errors "github.com/prometheus/prometheus/tsdb/errors"
"github.com/prometheus/prometheus/tsdb/fileutil"
2018-02-09 04:11:03 -08:00
)
// repairBadIndexVersion repairs an issue in index and meta.json persistence introduced in
// commit 129773b41a565fde5156301e37f9a87158030443.
2018-02-09 04:11:03 -08:00
func repairBadIndexVersion(logger log.Logger, dir string) error {
// All blocks written by Prometheus 2.1 with a meta.json version of 2 are affected.
// We must actually set the index file version to 2 and revert the meta.json version back to 1.
dirs, err := blockDirs(dir)
2018-02-09 04:11:03 -08:00
if err != nil {
return errors.Wrapf(err, "list block dirs in %q", dir)
2018-02-09 04:11:03 -08:00
}
tmpFiles := make([]string, 0, len(dirs))
defer func() {
for _, tmp := range tmpFiles {
if err := os.RemoveAll(tmp); err != nil {
level.Error(logger).Log("msg", "remove tmp file", "err", err.Error())
}
}
}()
for _, d := range dirs {
2018-02-09 04:11:03 -08:00
meta, err := readBogusMetaFile(d)
if err != nil {
level.Error(logger).Log("msg", "failed to read meta.json for a block during repair process; skipping", "dir", d, "err", err)
continue
2018-02-09 04:11:03 -08:00
}
if meta.Version == metaVersion1 {
level.Info(logger).Log(
"msg", "Found healthy block",
"mint", meta.MinTime,
"maxt", meta.MaxTime,
"ulid", meta.ULID,
)
2018-02-09 04:11:03 -08:00
continue
}
level.Info(logger).Log(
"msg", "Fixing broken block",
"mint", meta.MinTime,
"maxt", meta.MaxTime,
"ulid", meta.ULID,
)
2018-02-09 04:11:03 -08:00
repl, err := os.Create(filepath.Join(d, "index.repaired"))
if err != nil {
return errors.Wrapf(err, "create index.repaired for block dir: %v", d)
2018-02-09 04:11:03 -08:00
}
tmpFiles = append(tmpFiles, repl.Name())
broken, err := os.Open(filepath.Join(d, indexFilename))
2018-02-09 04:11:03 -08:00
if err != nil {
return errors.Wrapf(err, "open broken index for block dir: %v", d)
2018-02-09 04:11:03 -08:00
}
if _, err := io.Copy(repl, broken); err != nil {
return errors.Wrapf(err, "copy content of index to index.repaired for block dir: %v", d)
2018-02-09 04:11:03 -08:00
}
// Set the 5th byte to 2 to indicate the correct file format version.
2018-02-09 04:11:03 -08:00
if _, err := repl.WriteAt([]byte{2}, 4); err != nil {
return tsdb_errors.NewMulti(
errors.Wrapf(err, "rewrite of index.repaired for block dir: %v", d),
errors.Wrap(repl.Close(), "close"),
).Err()
2018-02-09 04:11:03 -08:00
}
if err := repl.Sync(); err != nil {
return tsdb_errors.NewMulti(
errors.Wrapf(err, "sync of index.repaired for block dir: %v", d),
errors.Wrap(repl.Close(), "close"),
).Err()
2018-02-09 04:11:03 -08:00
}
if err := repl.Close(); err != nil {
return errors.Wrapf(repl.Close(), "close repaired index for block dir: %v", d)
2018-02-09 04:11:03 -08:00
}
if err := broken.Close(); err != nil {
return errors.Wrapf(repl.Close(), "close broken index for block dir: %v", d)
}
if err := fileutil.Replace(repl.Name(), broken.Name()); err != nil {
return errors.Wrapf(repl.Close(), "replaced broken index with index.repaired for block dir: %v", d)
2018-02-09 04:11:03 -08:00
}
// Reset version of meta.json to 1.
meta.Version = metaVersion1
if _, err := writeMetaFile(logger, d, meta); err != nil {
return errors.Wrapf(repl.Close(), "write meta for block dir: %v", d)
2018-02-09 04:11:03 -08:00
}
}
return nil
}
func readBogusMetaFile(dir string) (*BlockMeta, error) {
b, err := os.ReadFile(filepath.Join(dir, metaFilename))
2018-02-09 04:11:03 -08:00
if err != nil {
return nil, err
}
var m BlockMeta
if err := json.Unmarshal(b, &m); err != nil {
return nil, err
}
if m.Version != metaVersion1 && m.Version != 2 {
2018-02-09 04:11:03 -08:00
return nil, errors.Errorf("unexpected meta file version %d", m.Version)
}
return &m, nil
}