2016-12-04 04:16:11 -08:00
|
|
|
package tsdb
|
|
|
|
|
2016-12-09 01:41:51 -08:00
|
|
|
import (
|
|
|
|
"sort"
|
|
|
|
"strings"
|
|
|
|
)
|
2016-12-04 04:16:11 -08:00
|
|
|
|
|
|
|
type memIndex struct {
|
|
|
|
lastID uint32
|
2016-12-09 01:41:51 -08:00
|
|
|
|
|
|
|
forward map[uint32]*chunkDesc // chunk ID to chunk desc
|
|
|
|
values map[string]stringset // label names to possible values
|
|
|
|
postings *memPostings // postings lists for terms
|
|
|
|
}
|
|
|
|
|
|
|
|
// newMemIndex returns a new in-memory index.
|
|
|
|
func newMemIndex() *memIndex {
|
|
|
|
return &memIndex{
|
|
|
|
lastID: 0,
|
|
|
|
forward: make(map[uint32]*chunkDesc),
|
|
|
|
values: make(map[string]stringset),
|
2016-12-10 00:44:00 -08:00
|
|
|
postings: &memPostings{m: make(map[term][]uint32)},
|
2016-12-09 01:41:51 -08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func (ix *memIndex) numSeries() int {
|
|
|
|
return len(ix.forward)
|
2016-12-04 04:16:11 -08:00
|
|
|
}
|
|
|
|
|
2016-12-14 12:58:29 -08:00
|
|
|
func (ix *memIndex) Postings(t term) Postings {
|
2016-12-10 00:44:00 -08:00
|
|
|
return ix.postings.get(t)
|
|
|
|
}
|
|
|
|
|
|
|
|
// term is a label name/value pair. It is comparable and serves as the key
// of the postings map.
type term struct {
	name, value string
}
|
|
|
|
|
2016-12-09 01:41:51 -08:00
|
|
|
func (ix *memIndex) add(chkd *chunkDesc) {
|
|
|
|
// Add each label pair as a term to the inverted index.
|
2016-12-10 00:44:00 -08:00
|
|
|
terms := make([]term, 0, len(chkd.lset))
|
2016-12-04 04:16:11 -08:00
|
|
|
|
2016-12-09 01:41:51 -08:00
|
|
|
for _, l := range chkd.lset {
|
2016-12-10 00:44:00 -08:00
|
|
|
terms = append(terms, term{name: l.Name, value: l.Value})
|
2016-12-09 01:41:51 -08:00
|
|
|
|
|
|
|
// Add to label name to values index.
|
|
|
|
valset, ok := ix.values[l.Name]
|
|
|
|
if !ok {
|
|
|
|
valset = stringset{}
|
|
|
|
ix.values[l.Name] = valset
|
|
|
|
}
|
|
|
|
valset.set(l.Value)
|
2016-12-04 04:16:11 -08:00
|
|
|
}
|
2016-12-09 01:41:51 -08:00
|
|
|
ix.lastID++
|
|
|
|
id := ix.lastID
|
2016-12-04 04:16:11 -08:00
|
|
|
|
2016-12-09 01:41:51 -08:00
|
|
|
ix.postings.add(id, terms...)
|
|
|
|
|
|
|
|
// Store forward index for the returned ID.
|
|
|
|
ix.forward[id] = chkd
|
2016-12-04 04:16:11 -08:00
|
|
|
}
|
|
|
|
|
2016-12-09 01:41:51 -08:00
|
|
|
type memPostings struct {
|
2016-12-10 00:44:00 -08:00
|
|
|
m map[term][]uint32
|
2016-12-09 01:41:51 -08:00
|
|
|
}
|
|
|
|
|
|
|
|
// Postings returns an iterator over the postings list for s.
|
2016-12-14 12:58:29 -08:00
|
|
|
func (p *memPostings) get(t term) Postings {
|
2016-12-10 00:44:00 -08:00
|
|
|
return &listIterator{list: p.m[t], idx: -1}
|
2016-12-09 01:41:51 -08:00
|
|
|
}
|
|
|
|
|
|
|
|
// add adds a document to the index. The caller has to ensure that no
|
|
|
|
// term argument appears twice.
|
2016-12-10 00:44:00 -08:00
|
|
|
func (p *memPostings) add(id uint32, terms ...term) {
|
2016-12-09 01:41:51 -08:00
|
|
|
for _, t := range terms {
|
|
|
|
p.m[t] = append(p.m[t], id)
|
|
|
|
}
|
2016-12-04 04:16:11 -08:00
|
|
|
}
|
|
|
|
|
2016-12-14 12:58:29 -08:00
|
|
|
// Postings provides iterative access over a postings list.
type Postings interface {
	// Next advances the iterator and returns true if another value was found.
	Next() bool

	// Seek advances the iterator to value v or greater and returns
	// true if a value was found.
	Seek(v uint32) bool

	// Value returns the value at the current iterator position.
	Value() uint32

	// Err returns the last error of the iterator.
	Err() error
}
|
|
|
|
|
2016-12-14 12:58:29 -08:00
|
|
|
// errPostings is an empty iterator that always reports the error it was
// constructed with. With a nil err it acts as a plain empty iterator.
type errPostings struct {
	err error
}

// Next always returns false; the iterator holds no values.
func (e errPostings) Next() bool { return false }

// Seek always returns false; the iterator holds no values.
func (e errPostings) Seek(uint32) bool { return false }

// Value always returns 0; there is never a valid position.
func (e errPostings) Value() uint32 { return 0 }

// Err returns the error the iterator was constructed with.
func (e errPostings) Err() error { return e.err }
|
2016-12-13 06:26:58 -08:00
|
|
|
|
2016-12-14 12:58:29 -08:00
|
|
|
// Intersect returns a new postings list over the intersection of the
|
|
|
|
// input postings.
|
|
|
|
func Intersect(its ...Postings) Postings {
|
2016-12-04 04:16:11 -08:00
|
|
|
if len(its) == 0 {
|
2016-12-14 12:58:29 -08:00
|
|
|
return errPostings{err: nil}
|
2016-12-04 04:16:11 -08:00
|
|
|
}
|
|
|
|
a := its[0]
|
|
|
|
|
|
|
|
for _, b := range its[1:] {
|
2016-12-14 12:58:29 -08:00
|
|
|
a = &intersectPostings{a: a, b: b}
|
2016-12-04 04:16:11 -08:00
|
|
|
}
|
|
|
|
return a
|
|
|
|
}
|
|
|
|
|
2016-12-14 12:58:29 -08:00
|
|
|
type intersectPostings struct {
|
|
|
|
a, b Postings
|
2016-12-04 04:16:11 -08:00
|
|
|
}
|
|
|
|
|
2016-12-14 12:58:29 -08:00
|
|
|
func (it *intersectPostings) Value() uint32 {
|
2016-12-04 04:16:11 -08:00
|
|
|
return 0
|
|
|
|
}
|
|
|
|
|
2016-12-14 12:58:29 -08:00
|
|
|
func (it *intersectPostings) Next() bool {
|
2016-12-04 04:16:11 -08:00
|
|
|
return false
|
|
|
|
}
|
|
|
|
|
2016-12-14 12:58:29 -08:00
|
|
|
func (it *intersectPostings) Seek(id uint32) bool {
|
2016-12-04 04:16:11 -08:00
|
|
|
return false
|
|
|
|
}
|
|
|
|
|
2016-12-14 12:58:29 -08:00
|
|
|
func (it *intersectPostings) Err() error {
|
2016-12-13 06:26:58 -08:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2016-12-04 04:16:11 -08:00
|
|
|
// Merge returns a new iterator over the union of the input iterators.
|
2016-12-14 12:58:29 -08:00
|
|
|
func Merge(its ...Postings) Postings {
|
2016-12-04 04:16:11 -08:00
|
|
|
if len(its) == 0 {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
a := its[0]
|
|
|
|
|
|
|
|
for _, b := range its[1:] {
|
2016-12-14 12:58:29 -08:00
|
|
|
a = &mergePostings{a: a, b: b}
|
2016-12-04 04:16:11 -08:00
|
|
|
}
|
|
|
|
return a
|
|
|
|
}
|
|
|
|
|
2016-12-14 12:58:29 -08:00
|
|
|
type mergePostings struct {
|
|
|
|
a, b Postings
|
2016-12-04 04:16:11 -08:00
|
|
|
}
|
|
|
|
|
2016-12-14 12:58:29 -08:00
|
|
|
func (it *mergePostings) Value() uint32 {
|
2016-12-04 04:16:11 -08:00
|
|
|
return 0
|
|
|
|
}
|
|
|
|
|
2016-12-14 12:58:29 -08:00
|
|
|
func (it *mergePostings) Next() bool {
|
2016-12-04 04:16:11 -08:00
|
|
|
return false
|
|
|
|
}
|
|
|
|
|
2016-12-14 12:58:29 -08:00
|
|
|
func (it *mergePostings) Seek(id uint32) bool {
|
2016-12-04 04:16:11 -08:00
|
|
|
return false
|
|
|
|
}
|
|
|
|
|
2016-12-14 12:58:29 -08:00
|
|
|
func (it *mergePostings) Err() error {
|
2016-12-13 06:26:58 -08:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2016-12-04 04:16:11 -08:00
|
|
|
// listIterator implements the Postings interface over a plain list. The
// list must be sorted in ascending order for Seek to work. A fresh
// iterator starts with idx set to -1 so that the first call to Next lands
// on the first element.
type listIterator struct {
	list []uint32
	idx  int
}

// Value returns the value at the current position. It must only be called
// after Next or Seek returned true.
func (it *listIterator) Value() uint32 {
	return it.list[it.idx]
}

// Next advances the iterator by one element and reports whether it landed
// on a valid position.
func (it *listIterator) Next() bool {
	// Stop at len(list) so repeated calls on an exhausted iterator do not
	// keep growing idx.
	if it.idx < len(it.list) {
		it.idx++
	}
	return it.idx < len(it.list)
}

// Seek advances the iterator to the first value >= x at or after the
// current position and reports whether one was found. It never moves the
// iterator backwards.
func (it *listIterator) Seek(x uint32) bool {
	// A fresh iterator has idx == -1; start searching at the first element.
	start := it.idx
	if start < 0 {
		start = 0
	}
	if start >= len(it.list) {
		it.idx = len(it.list)
		return false
	}
	// Do binary search between current position and end. sort.Search
	// returns an offset relative to start, so it has to be added back.
	it.idx = start + sort.Search(len(it.list)-start, func(i int) bool {
		return it.list[start+i] >= x
	})
	return it.idx < len(it.list)
}

// Err always returns nil; iterating over an in-memory list cannot fail.
func (it *listIterator) Err() error {
	return nil
}
|
|
|
|
|
2016-12-09 01:41:51 -08:00
|
|
|
// stringset is a set of strings backed by a map with zero-width values.
type stringset map[string]struct{}

// set adds s to the set.
func (ss stringset) set(s string) {
	ss[s] = struct{}{}
}

// has reports whether s is a member of the set.
func (ss stringset) has(s string) bool {
	_, ok := ss[s]
	return ok
}

// String returns the members in sorted order, joined by commas.
func (ss stringset) String() string {
	return strings.Join(ss.slice(), ",")
}

// slice returns the members as a newly allocated, sorted slice.
func (ss stringset) slice() []string {
	slice := make([]string, 0, len(ss))
	for k := range ss {
		slice = append(slice, k)
	}
	// Map iteration order is random; sort for deterministic output.
	sort.Strings(slice)
	return slice
}
|