prometheus/head.go

package tsdb

import (
	"errors"
	"math"
	"sort"
	"sync"
	"time"

	"github.com/bradfitz/slice"
	"github.com/fabxc/tsdb/chunks"
	"github.com/fabxc/tsdb/labels"
	"github.com/go-kit/kit/log"
)

// HeadBlock handles reads and writes of time series data within a time window.
// All series and their samples are held in memory; appended data is also
// written to a write-ahead log so the block can be rebuilt by OpenHeadBlock.
type HeadBlock struct {
	// mtx guards the in-memory index below (descs, hashes, values, postings).
	// Readers take it shared; appendBatch takes it exclusively while it
	// creates new series.
	mtx sync.RWMutex
	// d is the directory the block was opened with.
	d   string

	// descs holds all chunk descs for the head block. Each chunk implicitly
	// is assigned the index as its ID.
	descs []*chunkDesc
	// mapper maps a series ID to its position in a list of all series
	// ordered by label set. It is rebuilt by updateMapping and can lag
	// behind descs between rebuilds.
	mapper *positionMapper
	// hashes contains a collision map of label set hashes of chunks
	// to their chunk descs.
	hashes map[uint64][]*chunkDesc

	values   map[string]stringset // label names to possible values
	postings *memPostings         // postings lists for terms

	// wal is the write-ahead log that appendBatch writes to before
	// applying changes in memory.
	wal *WAL

	// bstats holds the block statistics. It is protected by its own
	// mutex (bstats.mtx), not by mtx.
	bstats *BlockStats
}

// OpenHeadBlock opens the head block stored in dir. It opens the write-ahead
// log in that directory and replays every series and sample record into a
// fresh in-memory index, so the returned block reflects all data logged so
// far. An empty log yields an empty block.
//
// An error is returned if the WAL cannot be opened or read, or if a sample
// record references a series that was not declared earlier in the log. On
// error the WAL is closed again so no resources are leaked.
func OpenHeadBlock(dir string, l log.Logger) (*HeadBlock, error) {
	// NOTE(review): the 15s argument is presumably the WAL flush interval;
	// confirm against OpenWAL.
	wal, err := OpenWAL(dir, log.NewContext(l).With("component", "wal"), 15*time.Second)
	if err != nil {
		return nil, err
	}

	b := &HeadBlock{
		d:        dir,
		descs:    []*chunkDesc{},
		hashes:   map[uint64][]*chunkDesc{},
		values:   map[string]stringset{},
		postings: &memPostings{m: make(map[term][]uint32)},
		wal:      wal,
		mapper:   newPositionMapper(nil),
	}
	// Start with an inverted time range so the first sample sets both bounds.
	b.bstats = &BlockStats{
		MinTime: math.MaxInt64,
		MaxTime: math.MinInt64,
	}

	// The WAL handler callbacks cannot return errors, so the first replay
	// problem is remembered here and reported once ReadAll is done.
	var replayErr error

	err = wal.ReadAll(&walHandler{
		series: func(lset labels.Labels) {
			b.create(lset.Hash(), lset)

			// Keep the stats in line with what appendBatch records for
			// new series; the head block has one chunk per series.
			b.bstats.SeriesCount++
			b.bstats.ChunkCount++
		},
		sample: func(s hashedSample) {
			// A sample must reference a series that was replayed before it.
			if int(s.ref) >= len(b.descs) {
				if replayErr == nil {
					replayErr = errors.New("unknown series reference in WAL")
				}
				return
			}
			cd := b.descs[s.ref]

			// Duplicated from appendBatch – TODO(fabxc): deduplicate?
			if cd.lastTimestamp == s.t && cd.lastValue != s.v {
				return
			}
			cd.append(s.t, s.v)

			if s.t > b.bstats.MaxTime {
				b.bstats.MaxTime = s.t
			}
			if s.t < b.bstats.MinTime {
				b.bstats.MinTime = s.t
			}
			b.bstats.SampleCount++
		},
	})
	if err == nil {
		err = replayErr
	}
	if err != nil {
		// The block is unusable; release the WAL. The close error is
		// dropped on purpose because the replay error is the root cause.
		_ = wal.Close()
		return nil, err
	}

	b.updateMapping()

	return b, nil
}

// Close closes the head block's write-ahead log and reports the error,
// if any, returned by it.
func (h *HeadBlock) Close() error {
	err := h.wal.Close()
	return err
}

// dir returns the directory the head block was opened with.
func (h *HeadBlock) dir() string {
	return h.d
}

// persisted always reports false for a head block.
func (h *HeadBlock) persisted() bool {
	return false
}

// index returns the head block itself as its index reader.
func (h *HeadBlock) index() IndexReader {
	return h
}

// series returns the head block itself as its series reader.
func (h *HeadBlock) series() SeriesReader {
	return h
}

// stats returns a copy of the block statistics, taken while holding the
// statistics read lock.
func (h *HeadBlock) stats() BlockStats {
	st := h.bstats

	st.mtx.RLock()
	defer st.mtx.RUnlock()

	return *st
}

// Chunk looks up the chunk of the series with the given reference.
// It returns errNotFound if no series with that reference exists.
func (h *HeadBlock) Chunk(ref uint32) (chunks.Chunk, error) {
	h.mtx.RLock()
	defer h.mtx.RUnlock()

	idx := int(ref)
	if idx < len(h.descs) {
		return h.descs[idx].chunk, nil
	}
	return nil, errNotFound
}

// interval returns the minimum and maximum sample timestamps recorded in
// the block statistics. The statistics lock is held while reading so the
// pair is consistent with concurrent appends.
func (h *HeadBlock) interval() (int64, int64) {
	h.bstats.mtx.RLock()
	defer h.bstats.mtx.RUnlock()

	return h.bstats.MinTime, h.bstats.MaxTime
}

// Stats returns statistics about the indexed data. The snapshot is taken
// under the statistics lock via stats, so it does not race with appends.
// The returned error is always nil.
func (h *HeadBlock) Stats() (BlockStats, error) {
	return h.stats(), nil
}

// LabelValues returns the values recorded for a label name, sorted
// lexicographically. Exactly one name must be passed; any other number of
// names results in errInvalidSize.
func (h *HeadBlock) LabelValues(names ...string) (StringTuples, error) {
	h.mtx.RLock()
	defer h.mtx.RUnlock()

	if n := len(names); n != 1 {
		return nil, errInvalidSize
	}
	name := names[0]

	var vals []string
	for v := range h.values[name] {
		vals = append(vals, v)
	}
	sort.Strings(vals)

	tuples := &stringTuples{l: len(names), s: vals}
	return tuples, nil
}

// Postings returns the postings list for the term made of the given label
// name and value. The returned error is always nil.
func (h *HeadBlock) Postings(name, value string) (Postings, error) {
	key := term{name: name, value: value}

	h.mtx.RLock()
	defer h.mtx.RUnlock()

	return h.postings.get(key), nil
}

// Series returns the label set of the series with the given reference
// together with the metadata of its single head chunk. It returns
// errNotFound if no series with that reference exists.
func (h *HeadBlock) Series(ref uint32) (labels.Labels, []ChunkMeta, error) {
	h.mtx.RLock()
	defer h.mtx.RUnlock()

	if len(h.descs) <= int(ref) {
		return nil, nil, errNotFound
	}
	cd := h.descs[ref]

	// The chunk shares its reference with the series.
	metas := []ChunkMeta{{
		MinTime: cd.firstTimestamp,
		MaxTime: cd.lastTimestamp,
		Ref:     ref,
	}}
	return cd.lset, metas, nil
}

// LabelIndices returns one single-element tuple per label name that has
// recorded values. The tuples come back in map iteration order, which is
// not stable. The returned error is always nil.
func (h *HeadBlock) LabelIndices() ([][]string, error) {
	h.mtx.RLock()
	defer h.mtx.RUnlock()

	indices := make([][]string, 0, len(h.values))
	for name := range h.values {
		indices = append(indices, []string{name})
	}
	return indices, nil
}

// get looks up the chunk desc registered under hash whose label set equals
// lset. It returns nil if there is none; it never creates a series.
// The method does no locking of its own.
func (h *HeadBlock) get(hash uint64, lset labels.Labels) *chunkDesc {
	// Several label sets may share a hash, so compare the labels as well.
	for _, candidate := range h.hashes[hash] {
		if !candidate.lset.Equals(lset) {
			continue
		}
		return candidate
	}
	return nil
}

// create registers a new series for lset under hash and returns its chunk
// desc. The series gets the next free index in descs as its reference and
// is added to the hash map, the label value sets and the postings lists.
// It does not check whether the series already exists and does no locking
// of its own. It panics if no appender can be obtained for the new chunk.
func (h *HeadBlock) create(hash uint64, lset labels.Labels) *chunkDesc {
	chk := chunks.NewXORChunk()

	app, err := chk.Appender()
	if err != nil {
		// Getting an Appender for a new chunk must not fail.
		panic(err)
	}

	cd := &chunkDesc{
		lset:          lset,
		chunk:         chk,
		app:           app,
		lastTimestamp: math.MinInt64,
		// The reference is the position the desc is about to take in descs.
		ref: uint32(len(h.descs)),
	}

	h.descs = append(h.descs, cd)
	h.hashes[hash] = append(h.hashes[hash], cd)

	// Index every label pair of the series.
	for _, l := range lset {
		vals, found := h.values[l.Name]
		if !found {
			vals = stringset{}
			h.values[l.Name] = vals
		}
		vals.set(l.Value)

		h.postings.add(cd.ref, term{name: l.Name, value: l.Value})
	}

	// The empty term lists every series.
	h.postings.add(cd.ref, term{})

	return cd
}

var (
	// ErrOutOfOrderSample is returned if an appended sample has a
	// timestamp smaller than the most recent sample of its series.
	ErrOutOfOrderSample = errors.New("out of order sample")

	// ErrAmendSample is returned if an appended sample has the same timestamp
	// as the most recent sample but a different value.
	ErrAmendSample = errors.New("amending sample")
)

// appendBatch appends a batch of samples to the head block.
//
// It works in four steps:
//  1. Under the read lock, every sample is resolved to an existing series.
//     Samples of unknown series get a provisional reference, which is the
//     index of their series in the list of series to create.
//  2. The new series and all samples are written to the WAL.
//  3. If there are new series, the write lock is taken, the series are
//     created and the provisional references are rebased onto their final
//     position in descs.
//  4. The samples are appended to their chunks and the block statistics
//     are updated.
//
// The ref field of the passed samples is overwritten. It returns
// ErrOutOfOrderSample or ErrAmendSample if a sample conflicts with the
// latest sample of an existing series, or the error of the WAL write.
// In all of these cases nothing has been added to the in-memory block.
func (h *HeadBlock) appendBatch(samples []hashedSample) error {
	// Find head chunks for all samples and allocate new IDs/refs for
	// ones we haven't seen before.
	var (
		newSeries    []labels.Labels
		newSamples   []*hashedSample
		newHashes    []uint64
		uniqueHashes = map[uint64]uint32{}
	)
	h.mtx.RLock()
	defer h.mtx.RUnlock()

	for i := range samples {
		s := &samples[i]

		cd := h.get(s.hash, s.labels)
		if cd != nil {
			// Samples must only occur in order.
			if s.t < cd.lastTimestamp {
				return ErrOutOfOrderSample
			}
			if cd.lastTimestamp == s.t && cd.lastValue != s.v {
				return ErrAmendSample
			}
			// TODO(fabxc): sample refs are only scoped within a block for
			// now and we ignore any previously set value
			s.ref = cd.ref
			continue
		}

		// There may be several samples for a new series in a batch.
		// We don't want to reserve a new space for each.
		if ref, ok := uniqueHashes[s.hash]; ok {
			s.ref = ref
			// The reference is still provisional, so this sample has to be
			// rebased together with the first sample of its series.
			newSamples = append(newSamples, s)
			continue
		}
		s.ref = uint32(len(newSeries))
		uniqueHashes[s.hash] = s.ref

		newSeries = append(newSeries, s.labels)
		newHashes = append(newHashes, s.hash)
		newSamples = append(newSamples, s)
	}

	// Write all new series and samples to the WAL and add it to the
	// in-mem database on success.
	if err := h.wal.Log(newSeries, samples); err != nil {
		return err
	}

	// After the samples were successfully written to the WAL, there may
	// be no further failures.
	if len(newSeries) > 0 {
		// An RWMutex cannot be upgraded in place: drop the read lock, take
		// the write lock, and re-take the read lock afterwards so that the
		// deferred RUnlock stays balanced.
		// NOTE(review): other writers may run between RUnlock and Lock;
		// confirm that callers serialize appends.
		h.mtx.RUnlock()
		h.mtx.Lock()

		// The new series are appended to descs in order, so the final
		// reference is the provisional one shifted by the current length.
		base := len(h.descs)

		for i, s := range newSeries {
			h.create(newHashes[i], s)
		}
		for _, s := range newSamples {
			s.ref = uint32(base) + s.ref
		}

		h.mtx.Unlock()
		h.mtx.RLock()
	}

	var (
		total = uint64(len(samples))
		mint  = int64(math.MaxInt64)
		maxt  = int64(math.MinInt64)
	)
	for _, s := range samples {
		cd := h.descs[s.ref]
		// Skip samples that have the timestamp of the series' latest
		// sample but a different value; they are not counted either.
		if cd.lastTimestamp == s.t && cd.lastValue != s.v {
			total--
			continue
		}
		cd.append(s.t, s.v)

		if mint > s.t {
			mint = s.t
		}
		if maxt < s.t {
			maxt = s.t
		}
	}

	h.bstats.mtx.Lock()
	defer h.bstats.mtx.Unlock()

	h.bstats.SampleCount += total
	h.bstats.SeriesCount += uint64(len(newSeries))
	h.bstats.ChunkCount += uint64(len(newSeries)) // head block has one chunk/series

	if mint < h.bstats.MinTime {
		h.bstats.MinTime = mint
	}
	if maxt > h.bstats.MaxTime {
		h.bstats.MaxTime = maxt
	}

	return nil
}

// fullness relates the number of samples per series to a budget of 250:
// it returns SampleCount / (SeriesCount + 1) / 250. The +1 keeps the
// division defined for an empty block.
func (h *HeadBlock) fullness() float64 {
	h.bstats.mtx.RLock()
	defer h.bstats.mtx.RUnlock()

	samples := float64(h.bstats.SampleCount)
	series := float64(h.bstats.SeriesCount + 1)

	return samples / series / 250
}

// updateMapping rebuilds the position mapper from the current series,
// ordered by label set. It does nothing if the mapper already covers as
// many series as descs holds. Only the mapper lock is taken here.
func (h *HeadBlock) updateMapping() {
	m := h.mapper

	m.mtx.Lock()
	defer m.mtx.Unlock()

	upToDate := m.sortable != nil && m.Len() == len(h.descs)
	if upToDate {
		return
	}

	// Sort a copy so the order of descs itself stays untouched.
	snapshot := make([]*chunkDesc, len(h.descs))
	copy(snapshot, h.descs)

	byLabels := func(i, j int) bool {
		return labels.Compare(snapshot[i].lset, snapshot[j].lset) < 0
	}
	m.update(slice.SortInterface(snapshot, byLabels))
}

// remapPostings changes the order of the postings from their ID to the ordering
// of the series they reference.
// Returned postings have no longer monotonic IDs and MUST NOT be used for regular
// postings set operations, i.e. intersect and merge.
//
// References of series that were created after the position mapping was last
// updated are dropped, because the mapping holds no position for them yet.
// If p cannot be expanded, postings carrying that error are returned.
func (h *HeadBlock) remapPostings(p Postings) Postings {
	list, err := expandPostings(p)
	if err != nil {
		return errPostings{err: err}
	}

	h.mapper.mtx.RLock()
	defer h.mapper.mtx.RUnlock()

	// Filter in place: indexing the mapping with a reference it does not
	// cover would panic while sorting.
	known := len(h.mapper.fw)
	mapped := list[:0]
	for _, ref := range list {
		if int(ref) < known {
			mapped = append(mapped, ref)
		}
	}

	// A single sort by mapped position is sufficient.
	h.mapper.Sort(mapped)

	return newListPostings(mapped)
}

// positionMapper stores a position mapping from unsorted to
// sorted indices of a sortable collection.
// It implements sort.Interface itself so that sorting it sorts the wrapped
// collection and records the resulting permutation at the same time.
type positionMapper struct {
	// mtx is taken by the users of the mapper; the mapper's own methods
	// do not lock.
	mtx      sync.RWMutex
	// sortable is the wrapped collection; nil until update was called.
	sortable sort.Interface
	// iv maps a sorted position to the original index of the element there.
	// fw is the inverse: it maps an original index to its sorted position.
	iv, fw   []int
}

// newPositionMapper returns a position mapper for s. If s is nil, the
// mapper is returned empty and has to be filled with update later.
func newPositionMapper(s sort.Interface) *positionMapper {
	m := new(positionMapper)
	if s == nil {
		return m
	}
	m.update(s)
	return m
}

// Len returns the length of the wrapped collection.
// It must not be called before the mapper was given a collection.
func (m *positionMapper) Len() int {
	return m.sortable.Len()
}

// Less reports the ordering of elements i and j of the wrapped collection.
func (m *positionMapper) Less(i, j int) bool {
	return m.sortable.Less(i, j)
}

// Swap exchanges elements i and j of the wrapped collection and mirrors
// the exchange in iv, so iv keeps tracking where each element came from.
func (m *positionMapper) Swap(i, j int) {
	m.sortable.Swap(i, j)

	iv := m.iv
	iv[i], iv[j] = iv[j], iv[i]
}

// Sort orders the indices in l in place by their mapped (sorted) position.
// Every value in l has to be a valid index into the mapping.
func (m *positionMapper) Sort(l []uint32) {
	byPosition := func(a, b int) bool {
		return m.fw[l[a]] < m.fw[l[b]]
	}
	slice.Sort(l, byPosition)
}

// update replaces the wrapped collection with s, sorts it and rebuilds
// both index mappings from the permutation the sort applied.
func (m *positionMapper) update(s sort.Interface) {
	n := s.Len()

	m.sortable = s
	m.iv = make([]int, n)
	m.fw = make([]int, n)

	// Start from the identity; Swap keeps iv in step with the sort.
	for i := 0; i < n; i++ {
		m.iv[i] = i
	}
	sort.Sort(m)

	// Invert iv to get the forward mapping.
	for pos, orig := range m.iv {
		m.fw[orig] = pos
	}
}
-												Add new interfaces and skeleton

											
										
										
											2016-12-04 04:16:11 -08:00
+								package tsdb
 								import (
-												Modify IndexReader API to accomodate compaction

This changes the IndexReader API to expose plain labels
and chunk meta information instead of a Series interface.
Dropping of irrelevant chunks is moved into the querier.

A LabelIndices method is added to query for existing label
value indices.

											
										
										
											2016-12-31 06:35:08 -08:00
+									"errors"
-												Fix last timestamp initialization

This initializes the chunkDesc's last timestamp to the minimum
value so initial samples with a timestamp of 0 (e.g. in tests)
are not accidentally dropped.

											
										
										
											2017-01-04 05:06:40 -08:00
+									"math"
-												Misc fixes for initial Prometheus integration

											
										
										
											2016-12-14 09:38:46 -08:00
+									"sort"
-												Add new interfaces and skeleton

											
										
										
											2016-12-04 04:16:11 -08:00
+									"sync"
-												Periodically fsync WAL, make head cut async

											
										
										
											2017-01-06 06:18:06 -08:00
+									"time"
-												Add new interfaces and skeleton

											
										
										
											2016-12-04 04:16:11 -08:00
-												Add postings wrapper that emits head postings in label set order

This adds a position mapper that takes series from a head block
in the order they were appended and creates a mapping representing
them in order of their label sets.

Write-repair of the postings list would cause very expensive writing.
Hence, we keep them as they are and only apply the postition mapping
at the very end, after a postings list has been sufficienctly reduced
through intersections etc.

											
										
										
											2017-01-05 06:13:01 -08:00
+									"github.com/bradfitz/slice"
-												Add new interfaces and skeleton

											
										
										
											2016-12-04 04:16:11 -08:00
+									"github.com/fabxc/tsdb/chunks"
-												Extract labels package

											
										
										
											2016-12-21 00:39:01 -08:00
+									"github.com/fabxc/tsdb/labels"
-												Periodically fsync WAL, make head cut async

											
										
										
											2017-01-06 06:18:06 -08:00
+									"github.com/go-kit/kit/log"
-												Add new interfaces and skeleton

											
										
										
											2016-12-04 04:16:11 -08:00
+								)
 								// HeadBlock handles reads and writes of time series data within a time window.
 								type HeadBlock struct {
-												Consolidate mem index into HeadBlock

											
										
										
											2016-12-21 16:12:28 -08:00
+									mtx sync.RWMutex
-												Lock mmapped files

											
										
										
											2017-01-03 01:09:20 -08:00
+									d   string
-												Consolidate mem index into HeadBlock

											
										
										
											2016-12-21 16:12:28 -08:00
 									// descs holds all chunk descs for the head block. Each chunk implicitly
 									// is assigned the index as its ID.
 									descs []*chunkDesc
-												Add postings wrapper that emits head postings in label set order

This adds a position mapper that takes series from a head block
in the order they were appended and creates a mapping representing
them in order of their label sets.

Write-repair of the postings list would cause very expensive writing.
Hence, we keep them as they are and only apply the postition mapping
at the very end, after a postings list has been sufficienctly reduced
through intersections etc.

											
										
										
											2017-01-05 06:13:01 -08:00
+									// mapping maps a series ID to its position in an ordered list
 									// of all series. The orderDirty flag indicates that it has gone stale.
 									mapper *positionMapper
-												Consolidate mem index into HeadBlock

											
										
										
											2016-12-21 16:12:28 -08:00
+									// hashes contains a collision map of label set hashes of chunks
-												Remove double-reference in chunk hashmap

											
										
										
											2016-12-31 01:19:02 -08:00
+									// to their chunk descs.
 									hashes map[uint64][]*chunkDesc
-												Consolidate mem index into HeadBlock

											
										
										
											2016-12-21 16:12:28 -08:00
 									values   map[string]stringset // label names to possible values
 									postings *memPostings         // postings lists for terms
-												Bucket samples before appending.

This pre-sorts samples into buckets before appending them to reduce
locking of shards.

											
										
										
											2016-12-07 08:10:49 -08:00
-												Add initial WAL writing

											
										
										
											2016-12-22 03:05:24 -08:00
+									wal *WAL
-												Fix races

											
										
										
											2017-01-07 07:20:32 -08:00
+									bstats *BlockStats
-												Add new interfaces and skeleton

											
										
										
											2016-12-04 04:16:11 -08:00
+								}
-												Rename to OpenHeadBlock

											
										
										
											2016-12-22 11:00:24 -08:00
+								// OpenHeadBlock creates a new empty head block.
-												Periodically fsync WAL, make head cut async

											
										
										
											2017-01-06 06:18:06 -08:00
+								func OpenHeadBlock(dir string, l log.Logger) (*HeadBlock, error) {
 									wal, err := OpenWAL(dir, log.NewContext(l).With("component", "wal"), 15*time.Second)
-												Add initial WAL writing

											
										
										
											2016-12-22 03:05:24 -08:00
+									if err != nil {
 										return nil, err
 									}
-												Add stats serialization, load querier of all blocks

											
										
										
											2016-12-15 07:14:33 -08:00
+									b := &HeadBlock{
-												Lock mmapped files

											
										
										
											2017-01-03 01:09:20 -08:00
+										d:        dir,
-												Consolidate mem index into HeadBlock

											
										
										
											2016-12-21 16:12:28 -08:00
+										descs:    []*chunkDesc{},
-												Remove double-reference in chunk hashmap

											
										
										
											2016-12-31 01:19:02 -08:00
+										hashes:   map[uint64][]*chunkDesc{},
-												Consolidate mem index into HeadBlock

											
										
										
											2016-12-21 16:12:28 -08:00
+										values:   map[string]stringset{},
 										postings: &memPostings{m: make(map[term][]uint32)},
-												Add initial WAL writing

											
										
										
											2016-12-22 03:05:24 -08:00
+										wal:      wal,
-												Don't update head postings mapper on every append

											
										
										
											2017-01-06 07:27:50 -08:00
+										mapper:   newPositionMapper(nil),
-												Move sub-indexes into single index structure

											
										
										
											2016-12-09 01:41:51 -08:00
+									}
-												Fix races

											
										
										
											2017-01-07 07:20:32 -08:00
+									b.bstats = &BlockStats{
 										MinTime: math.MaxInt64,
 										MaxTime: math.MinInt64,
 									}
-												Handle compaction trigger and reinitializing in DB

											
										
										
											2017-01-06 03:37:28 -08:00
-												Add WAL decoder+loading and benchmarks

											
										
										
											2016-12-22 06:18:33 -08:00
+									err = wal.ReadAll(&walHandler{
 										series: func(lset labels.Labels) {
 											b.create(lset.Hash(), lset)
 										},
 										sample: func(s hashedSample) {
-												Switch to sequential block names

This changes block directory names from the int64 timestamp
to sequential numbering.

											
										
										
											2017-01-06 00:26:39 -08:00
+											cd := b.descs[s.ref]
 											// Duplicated from appendBatch – TODO(fabxc): deduplicate?
 											if cd.lastTimestamp == s.t && cd.lastValue != s.v {
 												return
 											}
 											cd.append(s.t, s.v)
 											if s.t > b.bstats.MaxTime {
 												b.bstats.MaxTime = s.t
 											}
 											if s.t < b.bstats.MinTime {
 												b.bstats.MinTime = s.t
 											}
-												Consolidate persistence and compaction

											
										
										
											2017-01-03 06:43:26 -08:00
+											b.bstats.SampleCount++
-												Add WAL decoder+loading and benchmarks

											
										
										
											2016-12-22 06:18:33 -08:00
+										},
 									})
 									if err != nil {
 										return nil, err
 									}
-												Don't update head postings mapper on every append

											
										
										
											2017-01-06 07:27:50 -08:00
+									b.updateMapping()
-												Add postings wrapper that emits head postings in label set order

This adds a position mapper that takes series from a head block
in the order they were appended and creates a mapping representing
them in order of their label sets.

Write-repair of the postings list would cause very expensive writing.
Hence, we keep them as they are and only apply the postition mapping
at the very end, after a postings list has been sufficienctly reduced
through intersections etc.

											
										
										
											2017-01-05 06:13:01 -08:00
-												Add initial WAL writing

											
										
										
											2016-12-22 03:05:24 -08:00
+									return b, nil
 								}
 								// Close syncs all data and closes underlying resources of the head block.
 								func (h *HeadBlock) Close() error {
 									return h.wal.Close()
-												Move sub-indexes into single index structure

											
										
										
											2016-12-09 01:41:51 -08:00
+								}
-												Lock mmapped files

											
										
										
											2017-01-03 01:09:20 -08:00
+								func (h *HeadBlock) dir() string          { return h.d }
-												Consolidate persistence and compaction

											
										
										
											2017-01-03 06:43:26 -08:00
+								func (h *HeadBlock) persisted() bool      { return false }
-												Lock mmapped files

											
										
										
											2017-01-03 01:09:20 -08:00
+								func (h *HeadBlock) index() IndexReader   { return h }
 								func (h *HeadBlock) series() SeriesReader { return h }
-												Fix head block stats races

											
										
										
											2017-01-07 09:02:17 -08:00
 								func (h *HeadBlock) stats() BlockStats {
 									h.bstats.mtx.RLock()
 									defer h.bstats.mtx.RUnlock()
 									return *h.bstats
 								}
-												Misc fixes for initial Prometheus integration

											
										
										
											2016-12-14 09:38:46 -08:00
-												Add stats serialization, load querier of all blocks

											
										
										
											2016-12-15 07:14:33 -08:00
+								// Chunk returns the chunk for the reference number.
-												Misc fixes for initial Prometheus integration

											
										
										
											2016-12-14 09:38:46 -08:00
+								func (h *HeadBlock) Chunk(ref uint32) (chunks.Chunk, error) {
-												Use separate lock for series creation

This uses the head block's own lock to only lock if new series were
encountered.
In the general append case we just need to hold a

											
										
										
											2017-01-06 08:23:12 -08:00
+									h.mtx.RLock()
 									defer h.mtx.RUnlock()
-												Consolidate mem index into HeadBlock

											
										
										
											2016-12-21 16:12:28 -08:00
+									if int(ref) >= len(h.descs) {
-												Misc fixes for initial Prometheus integration

											
										
										
											2016-12-14 09:38:46 -08:00
+										return nil, errNotFound
 									}
-												Consolidate mem index into HeadBlock

											
										
										
											2016-12-21 16:12:28 -08:00
+									return h.descs[int(ref)].chunk, nil
-												Misc fixes for initial Prometheus integration

											
										
										
											2016-12-14 09:38:46 -08:00
+								}
-												Add stats serialization, load querier of all blocks

											
										
										
											2016-12-15 07:14:33 -08:00
+								func (h *HeadBlock) interval() (int64, int64) {
-												Consolidate persistence and compaction

											
										
										
											2017-01-03 06:43:26 -08:00
+									return h.bstats.MinTime, h.bstats.MaxTime
-												Add stats serialization, load querier of all blocks

											
										
										
											2016-12-15 07:14:33 -08:00
+								}
-												Misc fixes for initial Prometheus integration

											
										
										
											2016-12-14 09:38:46 -08:00
+								// Stats returns statisitics about the indexed data.
-												Add stats serialization, load querier of all blocks

											
										
										
											2016-12-15 07:14:33 -08:00
+								func (h *HeadBlock) Stats() (BlockStats, error) {
-												Fix races

											
										
										
											2017-01-07 07:20:32 -08:00
+									return *h.bstats, nil
-												Misc fixes for initial Prometheus integration

											
										
										
											2016-12-14 09:38:46 -08:00
+								}
 								// LabelValues returns the possible label values
 								func (h *HeadBlock) LabelValues(names ...string) (StringTuples, error) {
-												Use separate lock for series creation

This uses the head block's own lock to only lock if new series were
encountered.
In the general append case we just need to hold a

											
										
										
											2017-01-06 08:23:12 -08:00
+									h.mtx.RLock()
 									defer h.mtx.RUnlock()
-												Misc fixes for initial Prometheus integration

											
										
										
											2016-12-14 09:38:46 -08:00
+									if len(names) != 1 {
 										return nil, errInvalidSize
 									}
 									var sl []string
-												Consolidate mem index into HeadBlock

											
										
										
											2016-12-21 16:12:28 -08:00
+									for s := range h.values[names[0]] {
-												Misc fixes for initial Prometheus integration

											
										
										
											2016-12-14 09:38:46 -08:00
+										sl = append(sl, s)
 									}
 									sort.Strings(sl)
-												Add postings wrapper that emits head postings in label set order

This adds a position mapper that takes series from a head block
in the order they were appended and creates a mapping representing
them in order of their label sets.

Write-repair of the postings list would cause very expensive writing.
Hence, we keep them as they are and only apply the postition mapping
at the very end, after a postings list has been sufficienctly reduced
through intersections etc.

											
										
										
											2017-01-05 06:13:01 -08:00
+									return &stringTuples{l: len(names), s: sl}, nil
-												Misc fixes for initial Prometheus integration

											
										
										
											2016-12-14 09:38:46 -08:00
+								}
 								// Postings returns the postings list iterator for the label pair.
-												Rename Iterator to Postings

											
										
										
											2016-12-14 12:58:29 -08:00
+								func (h *HeadBlock) Postings(name, value string) (Postings, error) {
-												Use separate lock for series creation

This uses the head block's own lock to only lock if new series were
encountered.
In the general append case we just need to hold a

											
										
										
											2017-01-06 08:23:12 -08:00
+									h.mtx.RLock()
 									defer h.mtx.RUnlock()
-												Consolidate mem index into HeadBlock

											
										
										
											2016-12-21 16:12:28 -08:00
+									return h.postings.get(term{name: name, value: value}), nil
-												Misc fixes for initial Prometheus integration

											
										
										
											2016-12-14 09:38:46 -08:00
+								}
 								// Series returns the series for the given reference.
-												Modify IndexReader API to accomodate compaction

This changes the IndexReader API to expose plain labels
and chunk meta information instead of a Series interface.
Dropping of irrelevant chunks is moved into the querier.

A LabelIndices method is added to query for existing label
value indices.

											
										
										
											2016-12-31 06:35:08 -08:00
+								func (h *HeadBlock) Series(ref uint32) (labels.Labels, []ChunkMeta, error) {
-												Use separate lock for series creation

This uses the head block's own lock to only lock if new series were
encountered.
In the general append case we just need to hold a

											
										
										
											2017-01-06 08:23:12 -08:00
+									h.mtx.RLock()
 									defer h.mtx.RUnlock()
-												Consolidate mem index into HeadBlock

											
										
										
											2016-12-21 16:12:28 -08:00
+									if int(ref) >= len(h.descs) {
-												Modify IndexReader API to accomodate compaction

This changes the IndexReader API to expose plain labels
and chunk meta information instead of a Series interface.
Dropping of irrelevant chunks is moved into the querier.

A LabelIndices method is added to query for existing label
value indices.

											
										
										
											2016-12-31 06:35:08 -08:00
+										return nil, nil, errNotFound
-												Misc fixes for initial Prometheus integration

											
										
										
											2016-12-14 09:38:46 -08:00
+									}
-												Consolidate mem index into HeadBlock

											
										
										
											2016-12-21 16:12:28 -08:00
+									cd := h.descs[ref]
-												Consolidate persistence and compaction

											
										
										
											2017-01-03 06:43:26 -08:00
+									meta := ChunkMeta{
-												Fix last timestamp initialization

This initializes the chunkDesc's last timestamp to the minimum
value so initial samples with a timestamp of 0 (e.g. in tests)
are not accidentally dropped.

											
										
										
											2017-01-04 05:06:40 -08:00
+										MinTime: cd.firstTimestamp,
-												Consolidate persistence and compaction

											
										
										
											2017-01-03 06:43:26 -08:00
+										MaxTime: cd.lastTimestamp,
 										Ref:     ref,
 									}
 									return cd.lset, []ChunkMeta{meta}, nil
-												Modify IndexReader API to accomodate compaction

This changes the IndexReader API to expose plain labels
and chunk meta information instead of a Series interface.
Dropping of irrelevant chunks is moved into the querier.

A LabelIndices method is added to query for existing label
value indices.

											
										
										
											2016-12-31 06:35:08 -08:00
+								}
 								func (h *HeadBlock) LabelIndices() ([][]string, error) {
-												Use separate lock for series creation

This uses the head block's own lock to only lock if new series were
encountered.
In the general append case we just need to hold a

											
										
										
											2017-01-06 08:23:12 -08:00
+									h.mtx.RLock()
 									defer h.mtx.RUnlock()
-												Modify IndexReader API to accomodate compaction

This changes the IndexReader API to expose plain labels
and chunk meta information instead of a Series interface.
Dropping of irrelevant chunks is moved into the querier.

A LabelIndices method is added to query for existing label
value indices.

											
										
										
											2016-12-31 06:35:08 -08:00
+									res := [][]string{}
 									for s := range h.values {
 										res = append(res, []string{s})
-												Misc fixes for initial Prometheus integration

											
										
										
											2016-12-14 09:38:46 -08:00
+									}
-												Modify IndexReader API to accomodate compaction

This changes the IndexReader API to expose plain labels
and chunk meta information instead of a Series interface.
Dropping of irrelevant chunks is moved into the querier.

A LabelIndices method is added to query for existing label
value indices.

											
										
										
											2016-12-31 06:35:08 -08:00
+									return res, nil
-												Misc fixes for initial Prometheus integration

											
										
										
											2016-12-14 09:38:46 -08:00
+								}
-												Add new interfaces and skeleton

											
										
										
											2016-12-04 04:16:11 -08:00
+								// get retrieves the chunk with the hash and label set and creates
 								// a new one if it doesn't exist yet.
-												Remove double-reference in chunk hashmap

											
										
										
											2016-12-31 01:19:02 -08:00
+								func (h *HeadBlock) get(hash uint64, lset labels.Labels) *chunkDesc {
 									cds := h.hashes[hash]
-												Consolidate mem index into HeadBlock

											
										
										
											2016-12-21 16:12:28 -08:00
-												Remove double-reference in chunk hashmap

											
										
										
											2016-12-31 01:19:02 -08:00
+									for _, cd := range cds {
 										if cd.lset.Equals(lset) {
 											return cd
-												Add new interfaces and skeleton

											
										
										
											2016-12-04 04:16:11 -08:00
+										}
 									}
-												Remove double-reference in chunk hashmap

											
										
										
											2016-12-31 01:19:02 -08:00
+									return nil
-												Add initial WAL writing

											
										
										
											2016-12-22 03:05:24 -08:00
+								}
 								func (h *HeadBlock) create(hash uint64, lset labels.Labels) *chunkDesc {
-												Add new interfaces and skeleton

											
										
										
											2016-12-04 04:16:11 -08:00
+									cd := &chunkDesc{
-												Fix last timestamp initialization

This initializes the chunkDesc's last timestamp to the minimum
value so initial samples with a timestamp of 0 (e.g. in tests)
are not accidentally dropped.

											
										
										
											2017-01-04 05:06:40 -08:00
+										lset:          lset,
 										chunk:         chunks.NewXORChunk(),
 										lastTimestamp: math.MinInt64,
-												Append to chunks cannot error

											
										
										
											2016-12-31 01:10:27 -08:00
+									}
-												Fix last timestamp initialization

This initializes the chunkDesc's last timestamp to the minimum
value so initial samples with a timestamp of 0 (e.g. in tests)
are not accidentally dropped.

											
										
										
											2017-01-04 05:06:40 -08:00
-												Switch to sequential block names

This changes block directory names from the int64 timestamp
to sequential numbering.

											
										
										
											2017-01-06 00:26:39 -08:00
+									var err error
-												Append to chunks cannot error

											
										
										
											2016-12-31 01:10:27 -08:00
+									cd.app, err = cd.chunk.Appender()
 									if err != nil {
 										// Getting an Appender for a new chunk must not panic.
 										panic(err)
-												Add new interfaces and skeleton

											
										
										
											2016-12-04 04:16:11 -08:00
+									}
-												Consolidate mem index into HeadBlock

											
										
										
											2016-12-21 16:12:28 -08:00
+									// Index the new chunk.
-												Remove double-reference in chunk hashmap

											
										
										
											2016-12-31 01:19:02 -08:00
+									cd.ref = uint32(len(h.descs))
-												Consolidate mem index into HeadBlock

											
										
										
											2016-12-21 16:12:28 -08:00
 									h.descs = append(h.descs, cd)
-												Remove double-reference in chunk hashmap

											
										
										
											2016-12-31 01:19:02 -08:00
+									h.hashes[hash] = append(h.hashes[hash], cd)
-												Consolidate mem index into HeadBlock

											
										
										
											2016-12-21 16:12:28 -08:00
 									for _, l := range lset {
 										valset, ok := h.values[l.Name]
 										if !ok {
 											valset = stringset{}
 											h.values[l.Name] = valset
 										}
 										valset.set(l.Value)
-												Consolidate persistence and compaction

											
										
										
											2017-01-03 06:43:26 -08:00
 										h.postings.add(cd.ref, term{name: l.Name, value: l.Value})
-												Consolidate mem index into HeadBlock

											
										
										
											2016-12-21 16:12:28 -08:00
+									}
-												Consolidate persistence and compaction

											
										
										
											2017-01-03 06:43:26 -08:00
 									h.postings.add(cd.ref, term{})
-												Add new interfaces and skeleton

											
										
										
											2016-12-04 04:16:11 -08:00
-												misc

											
										
										
											2016-12-09 01:00:14 -08:00
+									return cd
-												Add new interfaces and skeleton

											
										
										
											2016-12-04 04:16:11 -08:00
+								}
-												Modify IndexReader API to accomodate compaction

This changes the IndexReader API to expose plain labels
and chunk meta information instead of a Series interface.
Dropping of irrelevant chunks is moved into the querier.

A LabelIndices method is added to query for existing label
value indices.

											
										
										
											2016-12-31 06:35:08 -08:00
var (
	// ErrOutOfOrderSample is returned if an appended sample has a
	// timestamp smaller than the most recent sample of its series.
	ErrOutOfOrderSample = errors.New("out of order sample")

	// ErrAmendSample is returned if an appended sample has the same timestamp
	// as the most recent sample but a different value.
	ErrAmendSample = errors.New("amending sample")
)
-												Remove double-reference in chunk hashmap

											
										
										
											2016-12-31 01:19:02 -08:00
+								func (h *HeadBlock) appendBatch(samples []hashedSample) error {
-												Add initial WAL writing

											
										
										
											2016-12-22 03:05:24 -08:00
+									// Find head chunks for all samples and allocate new IDs/refs for
 									// ones we haven't seen before.
 									var (
-												Fix uniqueness of new series

											
										
										
											2016-12-26 07:55:32 -08:00
+										newSeries    []labels.Labels
-												Use separate lock for series creation

This uses the head block's own lock to only lock if new series were
encountered.
In the general append case we just need to hold a

											
										
										
											2017-01-06 08:23:12 -08:00
+										newSamples   []*hashedSample
-												Fix uniqueness of new series

											
										
										
											2016-12-26 07:55:32 -08:00
+										newHashes    []uint64
 										uniqueHashes = map[uint64]uint32{}
-												Add initial WAL writing

											
										
										
											2016-12-22 03:05:24 -08:00
+									)
-												Use separate lock for series creation

This uses the head block's own lock to only lock if new series were
encountered.
In the general append case we just need to hold a

											
										
										
											2017-01-06 08:23:12 -08:00
+									h.mtx.RLock()
-												Fix races

											
										
										
											2017-01-07 07:20:32 -08:00
+									defer h.mtx.RUnlock()
-												Consolidate mem index into HeadBlock

											
										
										
											2016-12-21 16:12:28 -08:00
-												Fix erroneous value assignments

											
										
										
											2016-12-22 11:57:00 -08:00
+									for i := range samples {
 										s := &samples[i]
-												Remove double-reference in chunk hashmap

											
										
										
											2016-12-31 01:19:02 -08:00
+										cd := h.get(s.hash, s.labels)
-												Add initial WAL writing

											
										
										
											2016-12-22 03:05:24 -08:00
+										if cd != nil {
-												Modify IndexReader API to accomodate compaction

This changes the IndexReader API to expose plain labels
and chunk meta information instead of a Series interface.
Dropping of irrelevant chunks is moved into the querier.

A LabelIndices method is added to query for existing label
value indices.

											
										
										
											2016-12-31 06:35:08 -08:00
+											// Samples must only occur in order.
 											if s.t < cd.lastTimestamp {
 												return ErrOutOfOrderSample
 											}
 											if cd.lastTimestamp == s.t && cd.lastValue != s.v {
 												return ErrAmendSample
 											}
-												Add initial WAL writing

											
										
										
											2016-12-22 03:05:24 -08:00
+											// TODO(fabxc): sample refs are only scoped within a block for
 											// now and we ignore any previously set value
-												Remove double-reference in chunk hashmap

											
										
										
											2016-12-31 01:19:02 -08:00
+											s.ref = cd.ref
-												Add initial WAL writing

											
										
										
											2016-12-22 03:05:24 -08:00
+											continue
 										}
-												Fix uniqueness of new series

											
										
										
											2016-12-26 07:55:32 -08:00
 										// There may be several samples for a new series in a batch.
 										// We don't want to reserve a new space for each.
 										if ref, ok := uniqueHashes[s.hash]; ok {
 											s.ref = ref
 											continue
 										}
-												Use separate lock for series creation

This uses the head block's own lock to only lock if new series were
encountered.
In the general append case we just need to hold a

											
										
										
											2017-01-06 08:23:12 -08:00
+										s.ref = uint32(len(newSeries))
-												Fix uniqueness of new series

											
										
										
											2016-12-26 07:55:32 -08:00
+										uniqueHashes[s.hash] = s.ref
-												Fix erroneous value assignments

											
										
										
											2016-12-22 11:57:00 -08:00
-												Add initial WAL writing

											
										
										
											2016-12-22 03:05:24 -08:00
+										newSeries = append(newSeries, s.labels)
 										newHashes = append(newHashes, s.hash)
-												Use separate lock for series creation

This uses the head block's own lock to only lock if new series were
encountered.
In the general append case we just need to hold a

											
										
										
											2017-01-06 08:23:12 -08:00
+										newSamples = append(newSamples, s)
-												Add initial WAL writing

											
										
										
											2016-12-22 03:05:24 -08:00
+									}
-												Consolidate mem index into HeadBlock

											
										
										
											2016-12-21 16:12:28 -08:00
-												Add initial WAL writing

											
										
										
											2016-12-22 03:05:24 -08:00
+									// Write all new series and samples to the WAL and add it to the
 									// in-mem database on success.
 									if err := h.wal.Log(newSeries, samples); err != nil {
-												Bucket samples before appending.

This pre-sorts samples into buckets before appending them to reduce
locking of shards.

											
										
										
											2016-12-07 08:10:49 -08:00
+										return err
 									}
-												Add initial seriailization of block data

											
										
										
											2016-12-08 08:43:10 -08:00
-												Remove double-reference in chunk hashmap

											
										
										
											2016-12-31 01:19:02 -08:00
+									// After the samples were successfully written to the WAL, there may
 									// be no further failures.
-												Use separate lock for series creation

This uses the head block's own lock to only lock if new series were
encountered.
In the general append case we just need to hold a

											
										
										
											2017-01-06 08:23:12 -08:00
+									if len(newSeries) > 0 {
-												Fix races

											
										
										
											2017-01-07 07:20:32 -08:00
+										h.mtx.RUnlock()
-												Use separate lock for series creation

This uses the head block's own lock to only lock if new series were
encountered.
In the general append case we just need to hold a

											
										
										
											2017-01-06 08:23:12 -08:00
+										h.mtx.Lock()
 										base := len(h.descs)
 										for i, s := range newSeries {
 											h.create(newHashes[i], s)
 										}
 										for _, s := range newSamples {
 											s.ref = uint32(base) + s.ref
 										}
 										h.mtx.Unlock()
 										h.mtx.RLock()
-												Add initial WAL writing

											
										
										
											2016-12-22 03:05:24 -08:00
+									}
-												cleanup and switching removal of unsafe calls.

											
										
										
											2016-12-10 09:08:50 -08:00
-												Fix head block stats races

											
										
										
											2017-01-07 09:02:17 -08:00
+									var (
 										total = uint64(len(samples))
 										mint  = int64(math.MaxInt64)
 										maxt  = int64(math.MinInt64)
 									)
-												Add initial WAL writing

											
										
										
											2016-12-22 03:05:24 -08:00
+									for _, s := range samples {
-												Modify IndexReader API to accomodate compaction

This changes the IndexReader API to expose plain labels
and chunk meta information instead of a Series interface.
Dropping of irrelevant chunks is moved into the querier.

A LabelIndices method is added to query for existing label
value indices.

											
										
										
											2016-12-31 06:35:08 -08:00
+										cd := h.descs[s.ref]
 										// Skip duplicate samples.
 										if cd.lastTimestamp == s.t && cd.lastValue != s.v {
-												Use separate lock for series creation

This uses the head block's own lock to only lock if new series were
encountered.
In the general append case we just need to hold a

											
										
										
											2017-01-06 08:23:12 -08:00
+											total--
-												Modify IndexReader API to accomodate compaction

This changes the IndexReader API to expose plain labels
and chunk meta information instead of a Series interface.
Dropping of irrelevant chunks is moved into the querier.

A LabelIndices method is added to query for existing label
value indices.

											
										
										
											2016-12-31 06:35:08 -08:00
+											continue
 										}
 										cd.append(s.t, s.v)
-												Add initial WAL writing

											
										
										
											2016-12-22 03:05:24 -08:00
-												Fix head block stats races

											
										
										
											2017-01-07 09:02:17 -08:00
+										if mint > s.t {
 											mint = s.t
-												Add initial WAL writing

											
										
										
											2016-12-22 03:05:24 -08:00
+										}
-												Fix head block stats races

											
										
										
											2017-01-07 09:02:17 -08:00
+										if maxt < s.t {
 											maxt = s.t
-												Switch to sequential block names

This changes block directory names from the int64 timestamp
to sequential numbering.

											
										
										
											2017-01-06 00:26:39 -08:00
+										}
-												misc

											
										
										
											2016-12-09 01:00:14 -08:00
+									}
-												Add stats serialization, load querier of all blocks

											
										
										
											2016-12-15 07:14:33 -08:00
-												Fix head block stats races

											
										
										
											2017-01-07 09:02:17 -08:00
+									h.bstats.mtx.Lock()
 									defer h.bstats.mtx.Unlock()
 									h.bstats.SampleCount += total
 									h.bstats.SeriesCount += uint64(len(newSeries))
 									h.bstats.ChunkCount += uint64(len(newSeries)) // head block has one chunk/series
 									if mint < h.bstats.MinTime {
 										h.bstats.MinTime = mint
 									}
 									if maxt > h.bstats.MaxTime {
 										h.bstats.MaxTime = maxt
 									}
-												Use separate lock for series creation

This uses the head block's own lock to only lock if new series were
encountered.
In the general append case we just need to hold a

											
										
										
											2017-01-06 08:23:12 -08:00
-												Append to chunks cannot error

											
										
										
											2016-12-31 01:10:27 -08:00
+									return nil
-												Add initial seriailization of block data

											
										
										
											2016-12-08 08:43:10 -08:00
+								}
-												Add postings wrapper that emits head postings in label set order

This adds a position mapper that takes series from a head block
in the order they were appended and creates a mapping representing
them in order of their label sets.

Write-repair of the postings list would cause very expensive writing.
Hence, we keep them as they are and only apply the position mapping
at the very end, after a postings list has been sufficiently reduced
through intersections etc.

											
										
										
											2017-01-05 06:13:01 -08:00
-												Fix head block stats races

											
										
										
											2017-01-07 09:02:17 -08:00
+								func (h *HeadBlock) fullness() float64 {
 									h.bstats.mtx.RLock()
 									defer h.bstats.mtx.RUnlock()
 									return float64(h.bstats.SampleCount) / float64(h.bstats.SeriesCount+1) / 250
 								}
-												Don't update head postings mapper on every append

											
										
										
											2017-01-06 07:27:50 -08:00
+								func (h *HeadBlock) updateMapping() {
 									h.mapper.mtx.Lock()
 									defer h.mapper.mtx.Unlock()
 									if h.mapper.sortable != nil && h.mapper.Len() == len(h.descs) {
 										return
 									}
-												Add postings wrapper that emits head postings in label set order

This adds a position mapper that takes series from a head block
in the order they were appended and creates a mapping representing
them in order of their label sets.

Write-repair of the postings list would cause very expensive writing.
Hence, we keep them as they are and only apply the postition mapping
at the very end, after a postings list has been sufficienctly reduced
through intersections etc.

											
										
										
											2017-01-05 06:13:01 -08:00
+									cds := make([]*chunkDesc, len(h.descs))
 									copy(cds, h.descs)
 									s := slice.SortInterface(cds, func(i, j int) bool {
 										return labels.Compare(cds[i].lset, cds[j].lset) < 0
 									})
-												Don't update head postings mapper on every append

											
										
										
											2017-01-06 07:27:50 -08:00
+									h.mapper.update(s)
 								}
 								// remapPostings changes the order of the postings from their ID to the ordering
 								// of the series they reference.
 								// Returned postings have no longer monotonic IDs and MUST NOT be used for regular
 								// postings set operations, i.e. intersect and merge.
 								func (h *HeadBlock) remapPostings(p Postings) Postings {
 									list, err := expandPostings(p)
 									if err != nil {
 										return errPostings{err: err}
 									}
 									h.mapper.mtx.RLock()
 									defer h.mapper.mtx.RUnlock()
 									h.mapper.Sort(list)
 									slice.Sort(list, func(i, j int) bool {
 										return h.mapper.fw[list[i]] < h.mapper.fw[list[j]]
 									})
 									return newListPostings(list)
-												Add postings wrapper that emits head postings in label set order

This adds a position mapper that takes series from a head block
in the order they were appended and creates a mapping representing
them in order of their label sets.

Write-repair of the postings list would cause very expensive writing.
Hence, we keep them as they are and only apply the postition mapping
at the very end, after a postings list has been sufficienctly reduced
through intersections etc.

											
										
										
											2017-01-05 06:13:01 -08:00
+								}
 								// positionMapper stores a position mapping from unsorted to
 								// sorted indices of a sortable collection.
 								type positionMapper struct {
-												Don't update head postings mapper on every append

											
										
										
											2017-01-06 07:27:50 -08:00
+									mtx      sync.RWMutex
-												Add postings wrapper that emits head postings in label set order

This adds a position mapper that takes series from a head block
in the order they were appended and creates a mapping representing
them in order of their label sets.

Write-repair of the postings list would cause very expensive writing.
Hence, we keep them as they are and only apply the postition mapping
at the very end, after a postings list has been sufficienctly reduced
through intersections etc.

											
										
										
											2017-01-05 06:13:01 -08:00
+									sortable sort.Interface
 									iv, fw   []int
 								}
 								func newPositionMapper(s sort.Interface) *positionMapper {
-												Don't update head postings mapper on every append

											
										
										
											2017-01-06 07:27:50 -08:00
+									m := &positionMapper{}
 									if s != nil {
 										m.update(s)
-												Add postings wrapper that emits head postings in label set order

This adds a position mapper that takes series from a head block
in the order they were appended and creates a mapping representing
them in order of their label sets.

Write-repair of the postings list would cause very expensive writing.
Hence, we keep them as they are and only apply the postition mapping
at the very end, after a postings list has been sufficienctly reduced
through intersections etc.

											
										
										
											2017-01-05 06:13:01 -08:00
+									}
 									return m
 								}
 								func (m *positionMapper) Len() int           { return m.sortable.Len() }
 								func (m *positionMapper) Less(i, j int) bool { return m.sortable.Less(i, j) }
 								func (m *positionMapper) Swap(i, j int) {
 									m.sortable.Swap(i, j)
 									m.iv[i], m.iv[j] = m.iv[j], m.iv[i]
 								}
-												Don't update head postings mapper on every append

											
										
										
											2017-01-06 07:27:50 -08:00
 								func (m *positionMapper) Sort(l []uint32) {
 									slice.Sort(l, func(i, j int) bool {
 										return m.fw[l[i]] < m.fw[l[j]]
 									})
 								}
 								func (m *positionMapper) update(s sort.Interface) {
 									m.sortable = s
 									m.iv = make([]int, s.Len())
 									m.fw = make([]int, s.Len())
 									for i := range m.iv {
 										m.iv[i] = i
 									}
 									sort.Sort(m)
 									for i, k := range m.iv {
 										m.fw[k] = i
 									}
 								}