mirror of
https://github.com/prometheus/prometheus.git
synced 2025-01-27 05:32:27 -08:00
Add initial WAL writing
This commit is contained in:
parent
2a825f6c28
commit
0b8c77361e
26
db.go
26
db.go
|
@ -163,6 +163,7 @@ func (ba *bucketAppender) Commit() error {
|
||||||
type hashedSample struct {
|
type hashedSample struct {
|
||||||
hash uint64
|
hash uint64
|
||||||
labels labels.Labels
|
labels labels.Labels
|
||||||
|
ref uint32
|
||||||
|
|
||||||
t int64
|
t int64
|
||||||
v float64
|
v float64
|
||||||
|
@ -197,18 +198,25 @@ func OpenShard(path string, logger log.Logger) (*Shard, error) {
|
||||||
return nil, err
|
return nil, err
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// TODO(fabxc): get time from client-defined `now` function.
|
||||||
|
baset := time.Now().UnixNano() / int64(time.Millisecond)
|
||||||
|
if len(pbs) > 0 {
|
||||||
|
baset = pbs[0].stats.MaxTime
|
||||||
|
}
|
||||||
|
|
||||||
|
head, err := NewHeadBlock(filepath.Join(path, fmt.Sprintf("%d", baset)), baset)
|
||||||
|
if err != nil {
|
||||||
|
return nil, err
|
||||||
|
}
|
||||||
|
|
||||||
s := &Shard{
|
s := &Shard{
|
||||||
path: path,
|
path: path,
|
||||||
persistCh: make(chan struct{}, 1),
|
persistCh: make(chan struct{}, 1),
|
||||||
logger: logger,
|
logger: logger,
|
||||||
|
head: head,
|
||||||
persisted: pbs,
|
persisted: pbs,
|
||||||
// TODO(fabxc): restore from checkpoint.
|
// TODO(fabxc): restore from checkpoint.
|
||||||
}
|
}
|
||||||
// TODO(fabxc): get base time from pre-existing blocks. Otherwise
|
|
||||||
// it should come from a user defined start timestamp.
|
|
||||||
// Use actual time for now.
|
|
||||||
s.head = NewHeadBlock(time.Now().UnixNano() / int64(time.Millisecond))
|
|
||||||
|
|
||||||
return s, nil
|
return s, nil
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -219,6 +227,7 @@ func (s *Shard) Close() error {
|
||||||
for _, pb := range s.persisted {
|
for _, pb := range s.persisted {
|
||||||
e.Add(pb.Close())
|
e.Add(pb.Close())
|
||||||
}
|
}
|
||||||
|
e.Add(s.head.Close())
|
||||||
|
|
||||||
return e.Err()
|
return e.Err()
|
||||||
}
|
}
|
||||||
|
@ -292,7 +301,12 @@ func (s *Shard) persist() error {
|
||||||
|
|
||||||
// Set new head block.
|
// Set new head block.
|
||||||
head := s.head
|
head := s.head
|
||||||
s.head = NewHeadBlock(head.stats.MaxTime)
|
newHead, err := NewHeadBlock(filepath.Join(s.path, fmt.Sprintf("%d", head.stats.MaxTime)), head.stats.MaxTime)
|
||||||
|
if err != nil {
|
||||||
|
s.mtx.Unlock()
|
||||||
|
return err
|
||||||
|
}
|
||||||
|
s.head = newHead
|
||||||
|
|
||||||
s.mtx.Unlock()
|
s.mtx.Unlock()
|
||||||
|
|
||||||
|
|
72
head.go
72
head.go
|
@ -21,24 +21,36 @@ type HeadBlock struct {
|
||||||
// to their position in the chunk desc slice.
|
// to their position in the chunk desc slice.
|
||||||
hashes map[uint64][]int
|
hashes map[uint64][]int
|
||||||
|
|
||||||
symbols []string // all seen strings
|
|
||||||
values map[string]stringset // label names to possible values
|
values map[string]stringset // label names to possible values
|
||||||
postings *memPostings // postings lists for terms
|
postings *memPostings // postings lists for terms
|
||||||
|
|
||||||
|
wal *WAL
|
||||||
|
|
||||||
stats BlockStats
|
stats BlockStats
|
||||||
}
|
}
|
||||||
|
|
||||||
// NewHeadBlock creates a new empty head block.
|
// NewHeadBlock creates a new empty head block.
|
||||||
func NewHeadBlock(baseTime int64) *HeadBlock {
|
func NewHeadBlock(dir string, baseTime int64) (*HeadBlock, error) {
|
||||||
|
wal, err := CreateWAL(dir)
|
||||||
|
if err != nil {
|
||||||
|
return nil, err
|
||||||
|
}
|
||||||
|
|
||||||
b := &HeadBlock{
|
b := &HeadBlock{
|
||||||
descs: []*chunkDesc{},
|
descs: []*chunkDesc{},
|
||||||
hashes: map[uint64][]int{},
|
hashes: map[uint64][]int{},
|
||||||
values: map[string]stringset{},
|
values: map[string]stringset{},
|
||||||
postings: &memPostings{m: make(map[term][]uint32)},
|
postings: &memPostings{m: make(map[term][]uint32)},
|
||||||
|
wal: wal,
|
||||||
}
|
}
|
||||||
b.stats.MinTime = baseTime
|
b.stats.MinTime = baseTime
|
||||||
|
|
||||||
return b
|
return b, nil
|
||||||
|
}
|
||||||
|
|
||||||
|
// Close syncs all data and closes underlying resources of the head block.
|
||||||
|
func (h *HeadBlock) Close() error {
|
||||||
|
return h.wal.Close()
|
||||||
}
|
}
|
||||||
|
|
||||||
// Querier returns a new querier over the head block.
|
// Querier returns a new querier over the head block.
|
||||||
|
@ -111,15 +123,18 @@ func (h *HeadBlock) Series(ref uint32, mint, maxt int64) (Series, error) {
|
||||||
|
|
||||||
// get retrieves the chunk with the hash and label set and creates
|
// get retrieves the chunk with the hash and label set and creates
|
||||||
// a new one if it doesn't exist yet.
|
// a new one if it doesn't exist yet.
|
||||||
func (h *HeadBlock) get(hash uint64, lset labels.Labels) *chunkDesc {
|
func (h *HeadBlock) get(hash uint64, lset labels.Labels) (*chunkDesc, uint32) {
|
||||||
refs := h.hashes[hash]
|
refs := h.hashes[hash]
|
||||||
|
|
||||||
for _, ref := range refs {
|
for _, ref := range refs {
|
||||||
if cd := h.descs[ref]; cd.lset.Equals(lset) {
|
if cd := h.descs[ref]; cd.lset.Equals(lset) {
|
||||||
return cd
|
return cd, uint32(ref)
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
// None of the given chunks was for the series, create a new one.
|
return nil, 0
|
||||||
|
}
|
||||||
|
|
||||||
|
func (h *HeadBlock) create(hash uint64, lset labels.Labels) *chunkDesc {
|
||||||
cd := &chunkDesc{
|
cd := &chunkDesc{
|
||||||
lset: lset,
|
lset: lset,
|
||||||
chunk: chunks.NewXORChunk(int(math.MaxInt64)),
|
chunk: chunks.NewXORChunk(int(math.MaxInt64)),
|
||||||
|
@ -128,7 +143,7 @@ func (h *HeadBlock) get(hash uint64, lset labels.Labels) *chunkDesc {
|
||||||
ref := len(h.descs)
|
ref := len(h.descs)
|
||||||
|
|
||||||
h.descs = append(h.descs, cd)
|
h.descs = append(h.descs, cd)
|
||||||
h.hashes[hash] = append(refs, ref)
|
h.hashes[hash] = append(h.hashes[hash], ref)
|
||||||
|
|
||||||
// Add each label pair as a term to the inverted index.
|
// Add each label pair as a term to the inverted index.
|
||||||
terms := make([]term, 0, len(lset))
|
terms := make([]term, 0, len(lset))
|
||||||
|
@ -153,28 +168,53 @@ func (h *HeadBlock) get(hash uint64, lset labels.Labels) *chunkDesc {
|
||||||
}
|
}
|
||||||
|
|
||||||
func (h *HeadBlock) appendBatch(samples []hashedSample) error {
|
func (h *HeadBlock) appendBatch(samples []hashedSample) error {
|
||||||
var merr MultiError
|
// Find head chunks for all samples and allocate new IDs/refs for
|
||||||
|
// ones we haven't seen before.
|
||||||
|
var (
|
||||||
|
newSeries []labels.Labels
|
||||||
|
newHashes []uint64
|
||||||
|
)
|
||||||
|
|
||||||
for _, s := range samples {
|
for _, s := range samples {
|
||||||
merr.Add(h.append(s.hash, s.labels, s.t, s.v))
|
cd, ref := h.get(s.hash, s.labels)
|
||||||
|
if cd != nil {
|
||||||
|
// TODO(fabxc): sample refs are only scoped within a block for
|
||||||
|
// now and we ignore any previously set value
|
||||||
|
s.ref = ref
|
||||||
|
continue
|
||||||
}
|
}
|
||||||
|
|
||||||
return merr.Err()
|
s.ref = uint32(len(h.descs) + len(newSeries))
|
||||||
|
newSeries = append(newSeries, s.labels)
|
||||||
|
newHashes = append(newHashes, s.hash)
|
||||||
}
|
}
|
||||||
|
|
||||||
// append adds the sample to the headblock.
|
// Write all new series and samples to the WAL and add it to the
|
||||||
func (h *HeadBlock) append(hash uint64, lset labels.Labels, ts int64, v float64) error {
|
// in-mem database on success.
|
||||||
if err := h.get(hash, lset).append(ts, v); err != nil {
|
if err := h.wal.Log(newSeries, samples); err != nil {
|
||||||
return err
|
return err
|
||||||
}
|
}
|
||||||
|
|
||||||
|
for i, s := range newSeries {
|
||||||
|
h.create(newHashes[i], s)
|
||||||
|
}
|
||||||
|
|
||||||
|
var merr MultiError
|
||||||
|
for _, s := range samples {
|
||||||
|
// TODO(fabxc): ensure that this won't be able to actually error in practice.
|
||||||
|
if err := h.descs[s.ref].append(s.t, s.v); err != nil {
|
||||||
|
merr.Add(err)
|
||||||
|
continue
|
||||||
|
}
|
||||||
|
|
||||||
h.stats.SampleCount++
|
h.stats.SampleCount++
|
||||||
|
|
||||||
if ts > h.stats.MaxTime {
|
if s.t > h.stats.MaxTime {
|
||||||
h.stats.MaxTime = ts
|
h.stats.MaxTime = s.t
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
return nil
|
return merr.Err()
|
||||||
}
|
}
|
||||||
|
|
||||||
func (h *HeadBlock) persist(p string) (int64, error) {
|
func (h *HeadBlock) persist(p string) (int64, error) {
|
||||||
|
|
191
wal.go
Normal file
191
wal.go
Normal file
|
@ -0,0 +1,191 @@
|
||||||
|
package tsdb
|
||||||
|
|
||||||
|
import (
|
||||||
|
"encoding/binary"
|
||||||
|
"hash/crc32"
|
||||||
|
"io"
|
||||||
|
"math"
|
||||||
|
"os"
|
||||||
|
"path/filepath"
|
||||||
|
|
||||||
|
"github.com/coreos/etcd/pkg/fileutil"
|
||||||
|
"github.com/fabxc/tsdb/labels"
|
||||||
|
)
|
||||||
|
|
||||||
|
// WALEntryType indicates what data a WAL entry contains.
|
||||||
|
type WALEntryType byte
|
||||||
|
|
||||||
|
// The valid WAL entry types.
|
||||||
|
const (
|
||||||
|
WALEntrySymbols = 1
|
||||||
|
WALEntrySeries = 2
|
||||||
|
WALEntrySamples = 3
|
||||||
|
)
|
||||||
|
|
||||||
|
// WAL is a write ahead log for series data. It can only be written to.
|
||||||
|
// Use WALReader to read back from a write ahead log.
|
||||||
|
type WAL struct {
|
||||||
|
f *fileutil.LockedFile
|
||||||
|
enc *walEncoder
|
||||||
|
|
||||||
|
symbols map[string]uint32
|
||||||
|
}
|
||||||
|
|
||||||
|
// CreateWAL creates a new write ahead log in the given directory.
|
||||||
|
func CreateWAL(dir string) (*WAL, error) {
|
||||||
|
if err := os.MkdirAll(dir, 0777); err != nil {
|
||||||
|
return nil, err
|
||||||
|
}
|
||||||
|
|
||||||
|
p := filepath.Join(dir, "wal")
|
||||||
|
|
||||||
|
f, err := fileutil.LockFile(p, os.O_WRONLY|os.O_CREATE, fileutil.PrivateFileMode)
|
||||||
|
if err != nil {
|
||||||
|
return nil, err
|
||||||
|
}
|
||||||
|
if _, err = f.Seek(0, os.SEEK_END); err != nil {
|
||||||
|
return nil, err
|
||||||
|
}
|
||||||
|
|
||||||
|
w := &WAL{
|
||||||
|
f: f,
|
||||||
|
enc: newWALEncoder(f),
|
||||||
|
symbols: map[string]uint32{},
|
||||||
|
}
|
||||||
|
return w, nil
|
||||||
|
}
|
||||||
|
|
||||||
|
// Log writes a batch of new series labels and samples to the log.
|
||||||
|
func (w *WAL) Log(series []labels.Labels, samples []hashedSample) error {
|
||||||
|
if err := w.enc.encodeSeries(series); err != nil {
|
||||||
|
return err
|
||||||
|
}
|
||||||
|
if err := w.enc.encodeSamples(samples); err != nil {
|
||||||
|
return err
|
||||||
|
}
|
||||||
|
return nil
|
||||||
|
}
|
||||||
|
|
||||||
|
func (w *WAL) sync() error {
|
||||||
|
return fileutil.Fdatasync(w.f.File)
|
||||||
|
}
|
||||||
|
|
||||||
|
// Close sync all data and closes the underlying resources.
|
||||||
|
func (w *WAL) Close() error {
|
||||||
|
if err := w.sync(); err != nil {
|
||||||
|
return err
|
||||||
|
}
|
||||||
|
return w.f.Close()
|
||||||
|
}
|
||||||
|
|
||||||
|
// OpenWAL does things.
|
||||||
|
func OpenWAL(dir string) (*WAL, error) {
|
||||||
|
return nil, nil
|
||||||
|
}
|
||||||
|
|
||||||
|
type walEncoder struct {
|
||||||
|
w io.Writer
|
||||||
|
|
||||||
|
buf []byte
|
||||||
|
}
|
||||||
|
|
||||||
|
func newWALEncoder(w io.Writer) *walEncoder {
|
||||||
|
return &walEncoder{
|
||||||
|
w: w,
|
||||||
|
buf: make([]byte, 1024*1024),
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
func (e *walEncoder) entry(et WALEntryType, flag byte, n int) error {
|
||||||
|
h := crc32.NewIEEE()
|
||||||
|
w := io.MultiWriter(h, e.w)
|
||||||
|
|
||||||
|
b := make([]byte, 6)
|
||||||
|
b[0] = byte(et)
|
||||||
|
b[1] = flag
|
||||||
|
|
||||||
|
binary.BigEndian.PutUint32(b[2:], uint32(len(e.buf)))
|
||||||
|
|
||||||
|
if _, err := w.Write(b); err != nil {
|
||||||
|
return err
|
||||||
|
}
|
||||||
|
if _, err := w.Write(e.buf[:n]); err != nil {
|
||||||
|
return err
|
||||||
|
}
|
||||||
|
if _, err := e.w.Write(h.Sum(nil)); err != nil {
|
||||||
|
return err
|
||||||
|
}
|
||||||
|
|
||||||
|
return nil
|
||||||
|
}
|
||||||
|
|
||||||
|
const (
|
||||||
|
walSeriesSimple = 1
|
||||||
|
walSamplesSimple = 1
|
||||||
|
)
|
||||||
|
|
||||||
|
func (e *walEncoder) encodeSeries(series []labels.Labels) error {
|
||||||
|
if len(series) == 0 {
|
||||||
|
return nil
|
||||||
|
}
|
||||||
|
var (
|
||||||
|
b = make([]byte, binary.MaxVarintLen32)
|
||||||
|
buf = e.buf[:0]
|
||||||
|
)
|
||||||
|
|
||||||
|
for _, lset := range series {
|
||||||
|
n := binary.PutUvarint(b, uint64(len(lset)))
|
||||||
|
buf = append(buf, b[:n]...)
|
||||||
|
|
||||||
|
for _, l := range lset {
|
||||||
|
n = binary.PutUvarint(b, uint64(len(l.Name)))
|
||||||
|
buf = append(buf, b[:n]...)
|
||||||
|
|
||||||
|
n = binary.PutUvarint(b, uint64(len(l.Value)))
|
||||||
|
buf = append(buf, b[:n]...)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
return e.entry(WALEntrySeries, walSeriesSimple, len(buf))
|
||||||
|
}
|
||||||
|
|
||||||
|
func (e *walEncoder) encodeSamples(samples []hashedSample) error {
|
||||||
|
if len(samples) == 0 {
|
||||||
|
return nil
|
||||||
|
}
|
||||||
|
var (
|
||||||
|
b = make([]byte, binary.MaxVarintLen64)
|
||||||
|
buf = e.buf[:0]
|
||||||
|
)
|
||||||
|
|
||||||
|
// Store base timestamp and base reference number of first sample.
|
||||||
|
// All samples encode their timestamp and ref as delta to those.
|
||||||
|
//
|
||||||
|
// TODO(fabxc): optimize for all samples having the same timestamp.
|
||||||
|
first := samples[0]
|
||||||
|
|
||||||
|
binary.BigEndian.PutUint32(b, first.ref)
|
||||||
|
buf = append(buf, b[:4]...)
|
||||||
|
binary.BigEndian.PutUint64(b, uint64(first.t))
|
||||||
|
buf = append(buf, b[:8]...)
|
||||||
|
|
||||||
|
for _, s := range samples {
|
||||||
|
n := binary.PutVarint(b, int64(s.ref)-int64(first.ref))
|
||||||
|
buf = append(buf, b[:n]...)
|
||||||
|
|
||||||
|
n = binary.PutVarint(b, s.t-first.t)
|
||||||
|
buf = append(buf, b[:n]...)
|
||||||
|
|
||||||
|
binary.BigEndian.PutUint64(b, math.Float64bits(s.v))
|
||||||
|
buf = append(buf, b[:8]...)
|
||||||
|
}
|
||||||
|
|
||||||
|
return e.entry(WALEntrySamples, walSamplesSimple, len(buf))
|
||||||
|
}
|
||||||
|
|
||||||
|
type walDecoder struct {
|
||||||
|
r io.Reader
|
||||||
|
|
||||||
|
handleSeries func(labels.Labels)
|
||||||
|
handleSample func(hashedSample)
|
||||||
|
}
|
Loading…
Reference in a new issue