mirror of
https://github.com/prometheus/prometheus.git
synced 2025-01-12 14:27:27 -08:00
Clarify docs, error on unexpected meta read errors
Signed-off-by: Fabian Reinartz <freinartz@google.com>
This commit is contained in:
parent
af9003dcef
commit
d907928e57
2
block.go
2
block.go
|
@ -178,6 +178,8 @@ type BlockMetaCompaction struct {
|
||||||
Level int `json:"level"`
|
Level int `json:"level"`
|
||||||
// ULIDs of all source head blocks that went into the block.
|
// ULIDs of all source head blocks that went into the block.
|
||||||
Sources []ulid.ULID `json:"sources,omitempty"`
|
Sources []ulid.ULID `json:"sources,omitempty"`
|
||||||
|
// Short descriptions of the direct blocks that were used to create
|
||||||
|
// this block.
|
||||||
Parents []BlockDesc `json:"parents,omitempty"`
|
Parents []BlockDesc `json:"parents,omitempty"`
|
||||||
Failed bool `json:"failed,omitempty"`
|
Failed bool `json:"failed,omitempty"`
|
||||||
}
|
}
|
||||||
|
|
29
db.go
29
db.go
|
@ -326,6 +326,13 @@ func (a dbAppender) Commit() error {
|
||||||
return err
|
return err
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// Compact data if possible. After successful compaction blocks are reloaded
|
||||||
|
// which will also trigger blocks to be deleted that fall out of the retention
|
||||||
|
// window.
|
||||||
|
// If no blocks are compacted, the retention window state doesn't change. Thus,
|
||||||
|
// this is sufficient to reliably delete old data.
|
||||||
|
// Old blocks are only deleted on reload based on the new block's parent information.
|
||||||
|
// See DB.reload documentation for further information.
|
||||||
func (db *DB) compact() (changes bool, err error) {
|
func (db *DB) compact() (changes bool, err error) {
|
||||||
db.cmtx.Lock()
|
db.cmtx.Lock()
|
||||||
defer db.cmtx.Unlock()
|
defer db.cmtx.Unlock()
|
||||||
|
@ -426,8 +433,13 @@ func (db *DB) reload() (err error) {
|
||||||
// We delete old blocks that have been superseded by new ones by gathering all parents
|
// We delete old blocks that have been superseded by new ones by gathering all parents
|
||||||
// from existing blocks. Those parents all have newer replacements and can be safely deleted
|
// from existing blocks. Those parents all have newer replacements and can be safely deleted
|
||||||
// after we loaded the other blocks.
|
// after we loaded the other blocks.
|
||||||
|
// This makes us resilient against the process crashing towards the end of a compaction.
|
||||||
|
// Creation of a new block and deletion of its parents cannot happen atomically. By creating
|
||||||
|
// blocks atomically with their parents, we can pick up the deletion where it left off during
|
||||||
|
// a crash.
|
||||||
var (
|
var (
|
||||||
blocks []*Block
|
blocks []*Block
|
||||||
|
corrupted = map[ulid.ULID]error{}
|
||||||
opened = map[ulid.ULID]struct{}{}
|
opened = map[ulid.ULID]struct{}{}
|
||||||
deleteable = map[ulid.ULID]struct{}{}
|
deleteable = map[ulid.ULID]struct{}{}
|
||||||
)
|
)
|
||||||
|
@ -437,6 +449,13 @@ func (db *DB) reload() (err error) {
|
||||||
// The block was potentially in the middle of being deleted during a crash.
|
// The block was potentially in the middle of being deleted during a crash.
|
||||||
// Skip it since we may delete it properly further down again.
|
// Skip it since we may delete it properly further down again.
|
||||||
level.Warn(db.logger).Log("msg", "read meta information", "err", err, "dir", dir)
|
level.Warn(db.logger).Log("msg", "read meta information", "err", err, "dir", dir)
|
||||||
|
|
||||||
|
ulid, err2 := ulid.Parse(filepath.Base(dir))
|
||||||
|
if err2 != nil {
|
||||||
|
level.Error(db.logger).Log("msg", "not a block dir", "dir", dir)
|
||||||
|
continue
|
||||||
|
}
|
||||||
|
corrupted[ulid] = err
|
||||||
continue
|
continue
|
||||||
}
|
}
|
||||||
if db.beyondRetention(meta) {
|
if db.beyondRetention(meta) {
|
||||||
|
@ -447,11 +466,17 @@ func (db *DB) reload() (err error) {
|
||||||
deleteable[b.ULID] = struct{}{}
|
deleteable[b.ULID] = struct{}{}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
// Blocks we failed to open should all be those we are want to delete anyway.
|
||||||
|
for c, err := range corrupted {
|
||||||
|
if _, ok := deleteable[c]; !ok {
|
||||||
|
return errors.Wrapf(err, "unexpected corrupted block %s", c)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
// Load new blocks into memory.
|
||||||
for _, dir := range dirs {
|
for _, dir := range dirs {
|
||||||
meta, err := readMetaFile(dir)
|
meta, err := readMetaFile(dir)
|
||||||
if err != nil {
|
if err != nil {
|
||||||
level.Warn(db.logger).Log("msg", "read meta information", "err", err, "dir", dir)
|
return errors.Wrapf(err, "read meta information %s", dir)
|
||||||
continue
|
|
||||||
}
|
}
|
||||||
// Don't load blocks that are scheduled for deletion.
|
// Don't load blocks that are scheduled for deletion.
|
||||||
if _, ok := deleteable[meta.ULID]; ok {
|
if _, ok := deleteable[meta.ULID]; ok {
|
||||||
|
|
Loading…
Reference in a new issue