2013-02-07 02:38:01 -08:00
// Copyright 2013 Prometheus Team
2012-12-09 07:27:12 -08:00
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
2013-02-08 09:03:26 -08:00
package metric
2012-12-09 07:27:12 -08:00
import (
"code.google.com/p/goprotobuf/proto"
2013-02-08 09:03:26 -08:00
"flag"
2013-04-28 05:47:43 -07:00
"fmt"
2013-01-27 09:49:45 -08:00
"github.com/prometheus/prometheus/coding"
"github.com/prometheus/prometheus/model"
dto "github.com/prometheus/prometheus/model/generated"
2013-02-06 08:06:39 -08:00
"github.com/prometheus/prometheus/storage"
2013-02-08 09:03:26 -08:00
index "github.com/prometheus/prometheus/storage/raw/index/leveldb"
leveldb "github.com/prometheus/prometheus/storage/raw/leveldb"
2013-01-27 09:49:45 -08:00
"github.com/prometheus/prometheus/utility"
2013-02-08 09:03:26 -08:00
"log"
2013-02-08 09:03:26 -08:00
"sort"
2013-03-04 11:43:07 -08:00
"sync"
2012-12-12 03:53:34 -08:00
"time"
2012-12-09 07:27:12 -08:00
)
2013-02-08 09:03:26 -08:00
var (
2013-03-12 10:20:16 -07:00
leveldbChunkSize = flag . Int ( "leveldbChunkSize" , 200 , "Maximum number of samples stored under one key." )
sortConcurrency = 2
2013-02-08 09:03:26 -08:00
)
type LevelDBMetricPersistence struct {
2013-05-02 03:49:13 -07:00
CurationRemarks * leveldb . LevelDBPersistence
2013-02-08 09:03:26 -08:00
fingerprintToMetrics * leveldb . LevelDBPersistence
labelNameToFingerprints * leveldb . LevelDBPersistence
labelSetToFingerprints * leveldb . LevelDBPersistence
2013-05-02 03:49:13 -07:00
MetricHighWatermarks * leveldb . LevelDBPersistence
2013-02-08 09:03:26 -08:00
metricMembershipIndex * index . LevelDBMembershipIndex
2013-05-02 03:49:13 -07:00
MetricSamples * leveldb . LevelDBPersistence
2013-02-08 09:03:26 -08:00
}
var (
// These flag values are back of the envelope, though they seem sensible.
// Please re-evaluate based on your own needs.
2013-04-28 05:47:43 -07:00
curationRemarksCacheSize = flag . Int ( "curationRemarksCacheSize" , 50 * 1024 * 1024 , "The size for the curation remarks cache (bytes)." )
2013-02-08 09:03:26 -08:00
fingerprintsToLabelPairCacheSize = flag . Int ( "fingerprintsToLabelPairCacheSizeBytes" , 100 * 1024 * 1024 , "The size for the fingerprint to label pair index (bytes)." )
2013-03-14 19:24:28 -07:00
highWatermarkCacheSize = flag . Int ( "highWatermarksByFingerprintSizeBytes" , 50 * 1024 * 1024 , "The size for the metric high watermarks (bytes)." )
2013-02-08 09:03:26 -08:00
labelNameToFingerprintsCacheSize = flag . Int ( "labelNameToFingerprintsCacheSizeBytes" , 100 * 1024 * 1024 , "The size for the label name to metric fingerprint index (bytes)." )
labelPairToFingerprintsCacheSize = flag . Int ( "labelPairToFingerprintsCacheSizeBytes" , 100 * 1024 * 1024 , "The size for the label pair to metric fingerprint index (bytes)." )
metricMembershipIndexCacheSize = flag . Int ( "metricMembershipCacheSizeBytes" , 50 * 1024 * 1024 , "The size for the metric membership index (bytes)." )
2013-04-28 05:47:43 -07:00
samplesByFingerprintCacheSize = flag . Int ( "samplesByFingerprintCacheSizeBytes" , 500 * 1024 * 1024 , "The size for the samples database (bytes)." )
2013-02-08 09:03:26 -08:00
)
type leveldbOpener func ( )
2013-04-01 04:22:38 -07:00
type leveldbCloser interface {
Close ( )
}
2013-02-08 09:03:26 -08:00
2013-04-01 04:22:38 -07:00
func ( l * LevelDBMetricPersistence ) Close ( ) {
var persistences = [ ] leveldbCloser {
2013-05-02 03:49:13 -07:00
l . CurationRemarks ,
2013-04-01 04:22:38 -07:00
l . fingerprintToMetrics ,
l . labelNameToFingerprints ,
l . labelSetToFingerprints ,
2013-05-02 03:49:13 -07:00
l . MetricHighWatermarks ,
2013-04-01 04:22:38 -07:00
l . metricMembershipIndex ,
2013-05-02 03:49:13 -07:00
l . MetricSamples ,
2013-02-08 09:03:26 -08:00
}
2013-04-01 04:22:38 -07:00
closerGroup := sync . WaitGroup { }
2013-02-08 09:03:26 -08:00
2013-04-01 04:22:38 -07:00
for _ , closer := range persistences {
closerGroup . Add ( 1 )
go func ( closer leveldbCloser ) {
2013-04-24 02:51:40 -07:00
if closer != nil {
closer . Close ( )
}
2013-04-01 04:22:38 -07:00
closerGroup . Done ( )
} ( closer )
2013-02-08 09:03:26 -08:00
}
2013-04-01 04:22:38 -07:00
closerGroup . Wait ( )
2013-02-08 09:03:26 -08:00
}
2013-04-28 05:47:43 -07:00
func NewLevelDBMetricPersistence ( baseDirectory string ) ( * LevelDBMetricPersistence , error ) {
workers := utility . NewUncertaintyGroup ( 7 )
2013-02-08 09:03:26 -08:00
emission := & LevelDBMetricPersistence { }
var subsystemOpeners = [ ] struct {
name string
opener leveldbOpener
} {
{
"Label Names and Value Pairs by Fingerprint" ,
func ( ) {
var err error
emission . fingerprintToMetrics , err = leveldb . NewLevelDBPersistence ( baseDirectory + "/label_name_and_value_pairs_by_fingerprint" , * fingerprintsToLabelPairCacheSize , 10 )
2013-04-28 05:47:43 -07:00
workers . MayFail ( err )
2013-02-08 09:03:26 -08:00
} ,
} ,
{
"Samples by Fingerprint" ,
func ( ) {
var err error
2013-05-02 03:49:13 -07:00
emission . MetricSamples , err = leveldb . NewLevelDBPersistence ( baseDirectory + "/samples_by_fingerprint" , * samplesByFingerprintCacheSize , 10 )
2013-04-28 05:47:43 -07:00
workers . MayFail ( err )
2013-02-08 09:03:26 -08:00
} ,
} ,
2013-03-14 19:24:28 -07:00
{
"High Watermarks by Fingerprint" ,
func ( ) {
var err error
2013-05-02 03:49:13 -07:00
emission . MetricHighWatermarks , err = leveldb . NewLevelDBPersistence ( baseDirectory + "/high_watermarks_by_fingerprint" , * highWatermarkCacheSize , 10 )
2013-04-28 05:47:43 -07:00
workers . MayFail ( err )
2013-03-14 19:24:28 -07:00
} ,
} ,
2013-02-08 09:03:26 -08:00
{
"Fingerprints by Label Name" ,
func ( ) {
var err error
emission . labelNameToFingerprints , err = leveldb . NewLevelDBPersistence ( baseDirectory + "/fingerprints_by_label_name" , * labelNameToFingerprintsCacheSize , 10 )
2013-04-28 05:47:43 -07:00
workers . MayFail ( err )
2013-02-08 09:03:26 -08:00
} ,
} ,
{
"Fingerprints by Label Name and Value Pair" ,
func ( ) {
var err error
emission . labelSetToFingerprints , err = leveldb . NewLevelDBPersistence ( baseDirectory + "/fingerprints_by_label_name_and_value_pair" , * labelPairToFingerprintsCacheSize , 10 )
2013-04-28 05:47:43 -07:00
workers . MayFail ( err )
2013-02-08 09:03:26 -08:00
} ,
} ,
{
"Metric Membership Index" ,
func ( ) {
var err error
emission . metricMembershipIndex , err = index . NewLevelDBMembershipIndex ( baseDirectory + "/metric_membership_index" , * metricMembershipIndexCacheSize , 10 )
2013-04-28 05:47:43 -07:00
workers . MayFail ( err )
} ,
} ,
{
"Sample Curation Remarks" ,
func ( ) {
var err error
2013-05-02 03:49:13 -07:00
emission . CurationRemarks , err = leveldb . NewLevelDBPersistence ( baseDirectory + "/curation_remarks" , * curationRemarksCacheSize , 10 )
2013-04-28 05:47:43 -07:00
workers . MayFail ( err )
2013-02-08 09:03:26 -08:00
} ,
} ,
}
for _ , subsystem := range subsystemOpeners {
opener := subsystem . opener
go opener ( )
}
2013-04-28 05:47:43 -07:00
if ! workers . Wait ( ) {
for _ , err := range workers . Errors ( ) {
log . Printf ( "Could not open storage due to %s" , err )
2013-02-08 09:03:26 -08:00
}
2013-04-28 05:47:43 -07:00
return nil , fmt . Errorf ( "Unable to open metric persistence." )
2013-02-08 09:03:26 -08:00
}
2013-04-28 05:47:43 -07:00
return emission , nil
2013-02-08 09:03:26 -08:00
}
func ( l * LevelDBMetricPersistence ) AppendSample ( sample model . Sample ) ( err error ) {
2013-04-05 09:03:45 -07:00
defer func ( begin time . Time ) {
2013-03-11 14:21:25 -07:00
duration := time . Since ( begin )
2013-02-08 09:03:26 -08:00
2013-03-01 09:51:36 -08:00
recordOutcome ( duration , err , map [ string ] string { operation : appendSample , result : success } , map [ string ] string { operation : appendSample , result : failure } )
2013-04-05 09:03:45 -07:00
} ( time . Now ( ) )
2013-02-08 09:03:26 -08:00
err = l . AppendSamples ( model . Samples { sample } )
return
}
2013-03-14 15:42:28 -07:00
// groupByFingerprint collects all of the provided samples, groups them
// together by their respective metric fingerprint, and finally sorts
// them chronologically.
func groupByFingerprint ( samples model . Samples ) map [ model . Fingerprint ] model . Samples {
2013-02-08 09:03:26 -08:00
var (
fingerprintToSamples = map [ model . Fingerprint ] model . Samples { }
)
for _ , sample := range samples {
fingerprint := model . NewFingerprintFromMetric ( sample . Metric )
samples := fingerprintToSamples [ fingerprint ]
samples = append ( samples , sample )
fingerprintToSamples [ fingerprint ] = samples
}
2013-03-04 11:43:07 -08:00
var (
sortingSemaphore = make ( chan bool , sortConcurrency )
2013-03-14 15:42:28 -07:00
doneSorting sync . WaitGroup
2013-03-04 11:43:07 -08:00
)
2013-03-14 15:42:28 -07:00
2013-02-08 09:03:26 -08:00
for i := 0 ; i < sortConcurrency ; i ++ {
sortingSemaphore <- true
}
for _ , samples := range fingerprintToSamples {
2013-03-04 11:43:07 -08:00
doneSorting . Add ( 1 )
2013-03-14 15:42:28 -07:00
2013-02-08 09:03:26 -08:00
go func ( samples model . Samples ) {
<- sortingSemaphore
sort . Sort ( samples )
sortingSemaphore <- true
2013-03-04 11:43:07 -08:00
doneSorting . Done ( )
2013-02-08 09:03:26 -08:00
} ( samples )
}
2013-03-04 11:43:07 -08:00
doneSorting . Wait ( )
2013-02-08 09:03:26 -08:00
2013-03-14 15:42:28 -07:00
return fingerprintToSamples
}
2013-03-07 11:01:32 -08:00
2013-03-14 16:55:50 -07:00
// findUnindexedMetrics scours the metric membership index for each given Metric
// in the keyspace and returns a map of Fingerprint-Metric pairs that are
// absent.
func ( l * LevelDBMetricPersistence ) findUnindexedMetrics ( candidates map [ model . Fingerprint ] model . Metric ) ( unindexed map [ model . Fingerprint ] model . Metric , err error ) {
2013-04-05 09:03:45 -07:00
defer func ( begin time . Time ) {
2013-03-14 15:42:28 -07:00
duration := time . Since ( begin )
2013-03-07 11:01:32 -08:00
2013-03-14 16:55:50 -07:00
recordOutcome ( duration , err , map [ string ] string { operation : findUnindexedMetrics , result : success } , map [ string ] string { operation : findUnindexedMetrics , result : failure } )
2013-04-05 09:03:45 -07:00
} ( time . Now ( ) )
2013-03-07 11:01:32 -08:00
2013-03-14 16:55:50 -07:00
unindexed = make ( map [ model . Fingerprint ] model . Metric )
2013-02-08 09:03:26 -08:00
// Determine which metrics are unknown in the database.
2013-03-14 16:55:50 -07:00
for fingerprint , metric := range candidates {
2013-04-05 09:03:45 -07:00
dto := model . MetricToDTO ( metric )
indexHas , err := l . hasIndexMetric ( dto )
2013-02-08 09:03:26 -08:00
if err != nil {
2013-04-05 09:03:45 -07:00
return unindexed , err
2013-02-08 09:03:26 -08:00
}
if ! indexHas {
2013-03-14 16:55:50 -07:00
unindexed [ fingerprint ] = metric
2013-02-08 09:03:26 -08:00
}
}
2013-03-14 16:55:50 -07:00
return
}
2013-03-14 17:19:45 -07:00
// indexLabelNames accumulates all label name to fingerprint index entries for
// the dirty metrics, appends the new dirtied metrics, sorts, and bulk updates
// the index to reflect the new state.
2013-03-14 17:38:34 -07:00
//
// This operation is idempotent.
2013-03-14 17:19:45 -07:00
func ( l * LevelDBMetricPersistence ) indexLabelNames ( metrics map [ model . Fingerprint ] model . Metric ) ( err error ) {
2013-04-05 09:03:45 -07:00
defer func ( begin time . Time ) {
2013-03-14 16:55:50 -07:00
duration := time . Since ( begin )
2013-03-14 17:19:45 -07:00
recordOutcome ( duration , err , map [ string ] string { operation : indexLabelNames , result : success } , map [ string ] string { operation : indexLabelNames , result : failure } )
2013-04-05 09:03:45 -07:00
} ( time . Now ( ) )
2013-03-14 16:55:50 -07:00
2013-03-14 17:19:45 -07:00
labelNameFingerprints := map [ model . LabelName ] utility . Set { }
2013-03-14 16:55:50 -07:00
2013-03-14 17:19:45 -07:00
for fingerprint , metric := range metrics {
for labelName := range metric {
fingerprintSet , ok := labelNameFingerprints [ labelName ]
if ! ok {
fingerprintSet = utility . Set { }
fingerprints , err := l . GetFingerprintsForLabelName ( labelName )
if err != nil {
return err
}
for _ , fingerprint := range fingerprints {
fingerprintSet . Add ( fingerprint )
}
}
fingerprintSet . Add ( fingerprint )
labelNameFingerprints [ labelName ] = fingerprintSet
}
2013-03-14 16:55:50 -07:00
}
2013-03-14 17:19:45 -07:00
batch := leveldb . NewBatch ( )
defer batch . Close ( )
2013-02-08 09:03:26 -08:00
2013-03-14 17:19:45 -07:00
for labelName , fingerprintSet := range labelNameFingerprints {
fingerprints := model . Fingerprints { }
for fingerprint := range fingerprintSet {
fingerprints = append ( fingerprints , fingerprint . ( model . Fingerprint ) )
}
2013-02-08 09:03:26 -08:00
2013-03-14 17:19:45 -07:00
sort . Sort ( fingerprints )
2013-03-06 19:04:51 -08:00
2013-03-14 17:19:45 -07:00
key := & dto . LabelName {
Name : proto . String ( string ( labelName ) ) ,
}
value := & dto . FingerprintCollection { }
for _ , fingerprint := range fingerprints {
value . Member = append ( value . Member , fingerprint . ToDTO ( ) )
2013-02-08 09:03:26 -08:00
}
2013-04-05 04:07:13 -07:00
batch . Put ( coding . NewProtocolBuffer ( key ) , coding . NewProtocolBuffer ( value ) )
2013-03-14 17:19:45 -07:00
}
2013-02-08 09:03:26 -08:00
2013-03-14 17:19:45 -07:00
err = l . labelNameToFingerprints . Commit ( batch )
if err != nil {
return
}
return
}
2013-02-08 09:03:26 -08:00
2013-03-14 17:19:45 -07:00
// indexLabelPairs accumulates all label pair to fingerprint index entries for
// the dirty metrics, appends the new dirtied metrics, sorts, and bulk updates
// the index to reflect the new state.
2013-03-14 17:38:34 -07:00
//
// This operation is idempotent.
2013-03-14 17:19:45 -07:00
func ( l * LevelDBMetricPersistence ) indexLabelPairs ( metrics map [ model . Fingerprint ] model . Metric ) ( err error ) {
2013-04-05 09:03:45 -07:00
defer func ( begin time . Time ) {
2013-03-14 17:19:45 -07:00
duration := time . Since ( begin )
2013-02-08 09:03:26 -08:00
2013-03-14 17:19:45 -07:00
recordOutcome ( duration , err , map [ string ] string { operation : indexLabelPairs , result : success } , map [ string ] string { operation : indexLabelPairs , result : failure } )
2013-04-05 09:03:45 -07:00
} ( time . Now ( ) )
2013-03-14 17:19:45 -07:00
labelPairFingerprints := map [ model . LabelPair ] utility . Set { }
for fingerprint , metric := range metrics {
for labelName , labelValue := range metric {
labelPair := model . LabelPair {
Name : labelName ,
Value : labelValue ,
2013-02-08 09:03:26 -08:00
}
2013-03-14 17:19:45 -07:00
fingerprintSet , ok := labelPairFingerprints [ labelPair ]
if ! ok {
fingerprintSet = utility . Set { }
fingerprints , err := l . GetFingerprintsForLabelSet ( model . LabelSet {
labelName : labelValue ,
} )
if err != nil {
return err
}
for _ , fingerprint := range fingerprints {
fingerprintSet . Add ( fingerprint )
}
2013-02-08 09:03:26 -08:00
}
2013-03-14 17:19:45 -07:00
fingerprintSet . Add ( fingerprint )
labelPairFingerprints [ labelPair ] = fingerprintSet
2013-02-08 09:03:26 -08:00
}
2013-03-14 17:19:45 -07:00
}
2013-02-08 09:03:26 -08:00
2013-03-14 17:19:45 -07:00
batch := leveldb . NewBatch ( )
defer batch . Close ( )
for labelPair , fingerprintSet := range labelPairFingerprints {
fingerprints := model . Fingerprints { }
for fingerprint := range fingerprintSet {
fingerprints = append ( fingerprints , fingerprint . ( model . Fingerprint ) )
2013-02-08 09:03:26 -08:00
}
2013-03-14 17:19:45 -07:00
sort . Sort ( fingerprints )
2013-02-08 09:03:26 -08:00
2013-03-14 17:19:45 -07:00
key := & dto . LabelPair {
Name : proto . String ( string ( labelPair . Name ) ) ,
Value : proto . String ( string ( labelPair . Value ) ) ,
}
value := & dto . FingerprintCollection { }
for _ , fingerprint := range fingerprints {
value . Member = append ( value . Member , fingerprint . ToDTO ( ) )
}
2013-02-08 09:03:26 -08:00
2013-04-05 04:07:13 -07:00
batch . Put ( coding . NewProtocolBuffer ( key ) , coding . NewProtocolBuffer ( value ) )
2013-03-14 17:19:45 -07:00
}
2013-02-08 09:03:26 -08:00
2013-03-14 17:19:45 -07:00
err = l . labelSetToFingerprints . Commit ( batch )
if err != nil {
return
}
2013-02-08 09:03:26 -08:00
2013-03-14 17:19:45 -07:00
return
}
2013-02-08 09:03:26 -08:00
2013-03-14 17:38:34 -07:00
// indexFingerprints updates all of the Fingerprint to Metric reverse lookups
// in the index and then bulk updates.
//
// This operation is idempotent.
func ( l * LevelDBMetricPersistence ) indexFingerprints ( metrics map [ model . Fingerprint ] model . Metric ) ( err error ) {
2013-04-05 09:03:45 -07:00
defer func ( begin time . Time ) {
2013-03-14 17:38:34 -07:00
duration := time . Since ( begin )
recordOutcome ( duration , err , map [ string ] string { operation : indexFingerprints , result : success } , map [ string ] string { operation : indexFingerprints , result : failure } )
2013-04-05 09:03:45 -07:00
} ( time . Now ( ) )
2013-03-14 17:38:34 -07:00
batch := leveldb . NewBatch ( )
defer batch . Close ( )
for fingerprint , metric := range metrics {
2013-04-05 04:07:13 -07:00
key := coding . NewProtocolBuffer ( fingerprint . ToDTO ( ) )
value := coding . NewProtocolBuffer ( model . MetricToDTO ( metric ) )
2013-03-14 17:38:34 -07:00
batch . Put ( key , value )
}
err = l . fingerprintToMetrics . Commit ( batch )
if err != nil {
2013-04-05 09:03:45 -07:00
return
2013-03-14 17:38:34 -07:00
}
return
}
2013-03-14 17:19:45 -07:00
// indexMetrics takes groups of samples, determines which ones contain metrics
// that are unknown to the storage stack, and then proceeds to update all
// affected indices.
func ( l * LevelDBMetricPersistence ) indexMetrics ( fingerprints map [ model . Fingerprint ] model . Metric ) ( err error ) {
2013-04-05 09:03:45 -07:00
defer func ( begin time . Time ) {
2013-03-14 17:19:45 -07:00
duration := time . Since ( begin )
2013-02-08 09:03:26 -08:00
2013-03-14 17:19:45 -07:00
recordOutcome ( duration , err , map [ string ] string { operation : indexMetrics , result : success } , map [ string ] string { operation : indexMetrics , result : failure } )
2013-04-05 09:03:45 -07:00
} ( time . Now ( ) )
2013-02-08 09:03:26 -08:00
2013-03-14 17:19:45 -07:00
var (
absentMetrics map [ model . Fingerprint ] model . Metric
)
2013-02-08 09:03:26 -08:00
2013-03-14 17:19:45 -07:00
absentMetrics , err = l . findUnindexedMetrics ( fingerprints )
if err != nil {
2013-04-05 09:03:45 -07:00
return
2013-03-14 17:19:45 -07:00
}
2013-02-08 09:03:26 -08:00
2013-03-14 17:19:45 -07:00
if len ( absentMetrics ) == 0 {
return
}
2013-02-08 09:03:26 -08:00
2013-03-14 17:19:45 -07:00
// TODO: For the missing fingerprints, determine what label names and pairs
// are absent and act accordingly and append fingerprints.
2013-04-28 05:47:43 -07:00
workers := utility . NewUncertaintyGroup ( 3 )
2013-03-14 17:19:45 -07:00
go func ( ) {
2013-04-28 05:47:43 -07:00
workers . MayFail ( l . indexLabelNames ( absentMetrics ) )
2013-03-14 17:19:45 -07:00
} ( )
go func ( ) {
2013-04-28 05:47:43 -07:00
workers . MayFail ( l . indexLabelPairs ( absentMetrics ) )
2013-02-08 09:03:26 -08:00
} ( )
2013-03-14 17:38:34 -07:00
go func ( ) {
2013-04-28 05:47:43 -07:00
workers . MayFail ( l . indexFingerprints ( absentMetrics ) )
2013-03-14 17:38:34 -07:00
} ( )
2013-04-28 05:47:43 -07:00
if ! workers . Wait ( ) {
return fmt . Errorf ( "Could not index due to %s" , workers . Errors ( ) )
2013-02-08 09:03:26 -08:00
}
2013-03-14 17:38:34 -07:00
// If any of the preceding operations failed, we will have inconsistent
// indices. Thusly, the Metric membership index should NOT be updated, as
// its state is used to determine whether to bulk update the other indices.
// Given that those operations are idempotent, it is OK to repeat them;
// however, it will consume considerable amounts of time.
2013-04-05 09:03:45 -07:00
batch := leveldb . NewBatch ( )
defer batch . Close ( )
2013-02-08 09:03:26 -08:00
2013-04-05 09:03:45 -07:00
// WART: We should probably encode simple fingerprints.
for _ , metric := range absentMetrics {
key := coding . NewProtocolBuffer ( model . MetricToDTO ( metric ) )
batch . Put ( key , key )
}
err = l . metricMembershipIndex . Commit ( batch )
if err != nil {
2013-04-28 05:47:43 -07:00
// Not critical but undesirable.
log . Println ( err )
2013-02-08 09:03:26 -08:00
}
2013-03-14 15:42:28 -07:00
return
}
2013-03-14 19:24:28 -07:00
func ( l * LevelDBMetricPersistence ) refreshHighWatermarks ( groups map [ model . Fingerprint ] model . Samples ) ( err error ) {
2013-04-05 09:03:45 -07:00
defer func ( begin time . Time ) {
2013-03-14 19:24:28 -07:00
duration := time . Since ( begin )
recordOutcome ( duration , err , map [ string ] string { operation : refreshHighWatermarks , result : success } , map [ string ] string { operation : refreshHighWatermarks , result : failure } )
2013-04-05 09:03:45 -07:00
} ( time . Now ( ) )
2013-03-14 19:24:28 -07:00
batch := leveldb . NewBatch ( )
defer batch . Close ( )
2013-04-05 09:03:45 -07:00
mutationCount := 0
2013-03-14 19:24:28 -07:00
for fingerprint , samples := range groups {
2013-04-05 09:03:45 -07:00
key := & dto . Fingerprint { }
value := & dto . MetricHighWatermark { }
raw := [ ] byte { }
newestSampleTimestamp := samples [ len ( samples ) - 1 ] . Timestamp
keyEncoded := coding . NewProtocolBuffer ( key )
2013-03-14 19:24:28 -07:00
key . Signature = proto . String ( fingerprint . ToRowKey ( ) )
2013-05-02 03:49:13 -07:00
raw , err = l . MetricHighWatermarks . Get ( keyEncoded )
2013-03-14 19:24:28 -07:00
if err != nil {
return
}
if raw != nil {
err = proto . Unmarshal ( raw , value )
if err != nil {
2013-04-05 09:03:45 -07:00
return
2013-03-14 19:24:28 -07:00
}
2013-03-26 03:56:10 -07:00
if newestSampleTimestamp . Before ( time . Unix ( * value . Timestamp , 0 ) ) {
2013-03-14 19:24:28 -07:00
continue
}
}
2013-03-26 03:56:10 -07:00
value . Timestamp = proto . Int64 ( newestSampleTimestamp . Unix ( ) )
2013-04-05 04:07:13 -07:00
batch . Put ( keyEncoded , coding . NewProtocolBuffer ( value ) )
2013-03-14 19:24:28 -07:00
mutationCount ++
}
2013-05-02 03:49:13 -07:00
err = l . MetricHighWatermarks . Commit ( batch )
2013-03-14 19:24:28 -07:00
if err != nil {
2013-04-05 09:03:45 -07:00
return
2013-03-14 19:24:28 -07:00
}
return
}
2013-03-14 15:42:28 -07:00
func ( l * LevelDBMetricPersistence ) AppendSamples ( samples model . Samples ) ( err error ) {
2013-04-05 09:03:45 -07:00
defer func ( begin time . Time ) {
2013-03-14 15:42:28 -07:00
duration := time . Since ( begin )
recordOutcome ( duration , err , map [ string ] string { operation : appendSamples , result : success } , map [ string ] string { operation : appendSamples , result : failure } )
2013-04-05 09:03:45 -07:00
} ( time . Now ( ) )
2013-03-14 15:42:28 -07:00
var (
fingerprintToSamples = groupByFingerprint ( samples )
2013-05-03 03:13:05 -07:00
indexErrChan = make ( chan error , 1 )
watermarkErrChan = make ( chan error , 1 )
2013-03-14 15:42:28 -07:00
)
go func ( groups map [ model . Fingerprint ] model . Samples ) {
2013-03-14 16:55:50 -07:00
var (
metrics = map [ model . Fingerprint ] model . Metric { }
)
for fingerprint , samples := range groups {
metrics [ fingerprint ] = samples [ 0 ] . Metric
}
indexErrChan <- l . indexMetrics ( metrics )
2013-03-14 15:42:28 -07:00
} ( fingerprintToSamples )
2013-03-14 19:24:28 -07:00
go func ( groups map [ model . Fingerprint ] model . Samples ) {
watermarkErrChan <- l . refreshHighWatermarks ( groups )
} ( fingerprintToSamples )
2013-03-14 18:09:19 -07:00
samplesBatch := leveldb . NewBatch ( )
defer samplesBatch . Close ( )
2013-03-14 15:42:28 -07:00
2013-03-14 18:09:19 -07:00
for fingerprint , group := range fingerprintToSamples {
for {
lengthOfGroup := len ( group )
2013-03-14 15:42:28 -07:00
2013-03-14 18:09:19 -07:00
if lengthOfGroup == 0 {
break
}
2013-03-14 15:42:28 -07:00
2013-03-14 18:09:19 -07:00
take := * leveldbChunkSize
if lengthOfGroup < take {
take = lengthOfGroup
}
2013-03-14 15:42:28 -07:00
2013-03-14 18:09:19 -07:00
chunk := group [ 0 : take ]
group = group [ take : lengthOfGroup ]
2013-03-14 15:42:28 -07:00
2013-04-21 10:16:15 -07:00
key := model . SampleKey {
Fingerprint : fingerprint ,
FirstTimestamp : chunk [ 0 ] . Timestamp ,
LastTimestamp : chunk [ take - 1 ] . Timestamp ,
SampleCount : uint32 ( take ) ,
} . ToDTO ( )
2013-03-14 15:42:28 -07:00
2013-03-14 18:09:19 -07:00
value := & dto . SampleValueSeries { }
for _ , sample := range chunk {
value . Value = append ( value . Value , & dto . SampleValueSeries_Value {
Timestamp : proto . Int64 ( sample . Timestamp . Unix ( ) ) ,
2013-04-21 09:15:56 -07:00
Value : sample . Value . ToDTO ( ) ,
2013-03-14 18:09:19 -07:00
} )
2013-03-14 15:42:28 -07:00
}
2013-03-14 18:09:19 -07:00
2013-04-05 04:07:13 -07:00
samplesBatch . Put ( coding . NewProtocolBuffer ( key ) , coding . NewProtocolBuffer ( value ) )
2013-03-14 15:42:28 -07:00
}
2013-03-14 18:09:19 -07:00
}
2013-03-14 15:42:28 -07:00
2013-05-02 03:49:13 -07:00
err = l . MetricSamples . Commit ( samplesBatch )
2013-03-14 18:09:19 -07:00
if err != nil {
2013-04-05 09:03:45 -07:00
return
2013-03-14 18:09:19 -07:00
}
2013-03-14 15:42:28 -07:00
err = <- indexErrChan
if err != nil {
2013-04-05 09:03:45 -07:00
return
2013-03-14 15:42:28 -07:00
}
2013-02-08 09:03:26 -08:00
2013-03-14 19:24:28 -07:00
err = <- watermarkErrChan
if err != nil {
2013-04-05 09:03:45 -07:00
return
2013-03-14 19:24:28 -07:00
}
2013-02-08 09:03:26 -08:00
return
}
2013-04-21 10:16:15 -07:00
func extractSampleKey ( i leveldb . Iterator ) ( key model . SampleKey , err error ) {
k := & dto . SampleKey { }
err = proto . Unmarshal ( i . Key ( ) , k )
if err != nil {
return
2013-03-06 18:16:20 -08:00
}
2013-04-21 10:16:15 -07:00
key = model . NewSampleKeyFromDTO ( k )
2012-12-25 04:50:36 -08:00
return
}
2013-04-22 04:30:16 -07:00
func extractSampleValues ( i leveldb . Iterator ) ( values model . Values , err error ) {
v := & dto . SampleValueSeries { }
2012-12-25 04:50:36 -08:00
err = proto . Unmarshal ( i . Value ( ) , v )
2013-04-22 04:30:16 -07:00
if err != nil {
return
}
values = model . NewValuesFromDTO ( v )
2012-12-25 04:50:36 -08:00
return
}
func fingerprintsEqual ( l * dto . Fingerprint , r * dto . Fingerprint ) bool {
if l == r {
return true
}
if l == nil && r == nil {
return true
}
if r . Signature == l . Signature {
return true
}
if * r . Signature == * l . Signature {
return true
}
return false
}
2013-01-23 08:18:45 -08:00
func ( l * LevelDBMetricPersistence ) hasIndexMetric ( dto * dto . Metric ) ( value bool , err error ) {
2013-04-05 09:03:45 -07:00
defer func ( begin time . Time ) {
2013-03-11 14:21:25 -07:00
duration := time . Since ( begin )
2013-01-23 08:18:45 -08:00
2013-03-01 09:51:36 -08:00
recordOutcome ( duration , err , map [ string ] string { operation : hasIndexMetric , result : success } , map [ string ] string { operation : hasIndexMetric , result : failure } )
2013-04-05 09:03:45 -07:00
} ( time . Now ( ) )
2013-01-23 08:18:45 -08:00
2013-04-05 04:07:13 -07:00
dtoKey := coding . NewProtocolBuffer ( dto )
2013-01-23 08:18:45 -08:00
value , err = l . metricMembershipIndex . Has ( dtoKey )
return
2012-12-09 07:27:12 -08:00
}
2013-01-23 08:18:45 -08:00
func ( l * LevelDBMetricPersistence ) HasLabelPair ( dto * dto . LabelPair ) ( value bool , err error ) {
2013-04-05 09:03:45 -07:00
defer func ( begin time . Time ) {
2013-03-11 14:21:25 -07:00
duration := time . Since ( begin )
2013-01-23 08:18:45 -08:00
2013-03-01 09:51:36 -08:00
recordOutcome ( duration , err , map [ string ] string { operation : hasLabelPair , result : success } , map [ string ] string { operation : hasLabelPair , result : failure } )
2013-04-05 09:03:45 -07:00
} ( time . Now ( ) )
2013-01-23 08:18:45 -08:00
2013-04-05 04:07:13 -07:00
dtoKey := coding . NewProtocolBuffer ( dto )
2013-01-23 08:18:45 -08:00
value , err = l . labelSetToFingerprints . Has ( dtoKey )
return
2012-12-09 07:27:12 -08:00
}
2013-01-23 08:18:45 -08:00
func ( l * LevelDBMetricPersistence ) HasLabelName ( dto * dto . LabelName ) ( value bool , err error ) {
2013-04-05 09:03:45 -07:00
defer func ( begin time . Time ) {
2013-03-11 14:21:25 -07:00
duration := time . Since ( begin )
2013-01-23 08:18:45 -08:00
2013-03-01 09:51:36 -08:00
recordOutcome ( duration , err , map [ string ] string { operation : hasLabelName , result : success } , map [ string ] string { operation : hasLabelName , result : failure } )
2013-04-05 09:03:45 -07:00
} ( time . Now ( ) )
2013-01-23 08:18:45 -08:00
2013-04-05 04:07:13 -07:00
dtoKey := coding . NewProtocolBuffer ( dto )
2013-01-23 08:18:45 -08:00
value , err = l . labelNameToFingerprints . Has ( dtoKey )
return
2012-12-09 07:27:12 -08:00
}
2013-02-08 09:03:26 -08:00
func ( l * LevelDBMetricPersistence ) GetFingerprintsForLabelSet ( labelSet model . LabelSet ) ( fps model . Fingerprints , err error ) {
2013-04-05 09:03:45 -07:00
defer func ( begin time . Time ) {
2013-03-11 14:21:25 -07:00
duration := time . Since ( begin )
2012-12-09 07:27:12 -08:00
2013-03-01 09:51:36 -08:00
recordOutcome ( duration , err , map [ string ] string { operation : getFingerprintsForLabelSet , result : success } , map [ string ] string { operation : getFingerprintsForLabelSet , result : failure } )
2013-04-05 09:03:45 -07:00
} ( time . Now ( ) )
2012-12-09 07:27:12 -08:00
2013-01-13 02:15:01 -08:00
sets := [ ] utility . Set { }
2012-12-09 07:27:12 -08:00
2013-02-13 17:13:41 -08:00
for _ , labelSetDTO := range model . LabelSetToDTOs ( & labelSet ) {
2013-04-05 04:07:13 -07:00
f , err := l . labelSetToFingerprints . Get ( coding . NewProtocolBuffer ( labelSetDTO ) )
2012-12-25 04:50:36 -08:00
if err != nil {
return fps , err
}
unmarshaled := & dto . FingerprintCollection { }
err = proto . Unmarshal ( f , unmarshaled )
if err != nil {
return fps , err
}
2013-01-13 02:15:01 -08:00
set := utility . Set { }
2012-12-25 04:50:36 -08:00
for _ , m := range unmarshaled . Member {
2013-02-08 09:03:26 -08:00
fp := model . NewFingerprintFromRowKey ( * m . Signature )
2013-01-13 02:15:01 -08:00
set . Add ( fp )
2012-12-09 07:27:12 -08:00
}
2013-01-13 02:15:01 -08:00
sets = append ( sets , set )
}
numberOfSets := len ( sets )
if numberOfSets == 0 {
return
}
base := sets [ 0 ]
for i := 1 ; i < numberOfSets ; i ++ {
base = base . Intersection ( sets [ i ] )
}
for _ , e := range base . Elements ( ) {
fingerprint := e . ( model . Fingerprint )
2013-02-14 08:07:59 -08:00
fps = append ( fps , fingerprint )
2012-12-09 07:27:12 -08:00
}
2012-12-25 04:50:36 -08:00
return
2012-12-09 07:27:12 -08:00
}
2013-02-08 09:03:26 -08:00
func ( l * LevelDBMetricPersistence ) GetFingerprintsForLabelName ( labelName model . LabelName ) ( fps model . Fingerprints , err error ) {
2013-04-05 09:03:45 -07:00
defer func ( begin time . Time ) {
2013-03-11 14:21:25 -07:00
duration := time . Since ( begin )
2012-12-09 07:27:12 -08:00
2013-03-01 09:51:36 -08:00
recordOutcome ( duration , err , map [ string ] string { operation : getFingerprintsForLabelName , result : success } , map [ string ] string { operation : getFingerprintsForLabelName , result : failure } )
2013-04-05 09:03:45 -07:00
} ( time . Now ( ) )
2012-12-09 07:27:12 -08:00
2013-04-05 04:07:13 -07:00
raw , err := l . labelNameToFingerprints . Get ( coding . NewProtocolBuffer ( model . LabelNameToDTO ( & labelName ) ) )
2012-12-25 04:50:36 -08:00
if err != nil {
return
2012-12-09 07:27:12 -08:00
}
2012-12-25 04:50:36 -08:00
unmarshaled := & dto . FingerprintCollection { }
err = proto . Unmarshal ( raw , unmarshaled )
if err != nil {
return
}
for _ , m := range unmarshaled . Member {
2013-02-08 09:03:26 -08:00
fp := model . NewFingerprintFromRowKey ( * m . Signature )
2013-02-14 08:19:41 -08:00
fps = append ( fps , fp )
2012-12-25 04:50:36 -08:00
}
return
2012-12-09 07:27:12 -08:00
}
2013-02-08 09:03:26 -08:00
func ( l * LevelDBMetricPersistence ) GetMetricForFingerprint ( f model . Fingerprint ) ( m * model . Metric , err error ) {
2013-04-05 09:03:45 -07:00
defer func ( begin time . Time ) {
2013-03-11 14:21:25 -07:00
duration := time . Since ( begin )
2012-12-25 04:50:36 -08:00
2013-03-01 09:51:36 -08:00
recordOutcome ( duration , err , map [ string ] string { operation : getMetricForFingerprint , result : success } , map [ string ] string { operation : getMetricForFingerprint , result : failure } )
2013-04-05 09:03:45 -07:00
} ( time . Now ( ) )
2012-12-25 04:50:36 -08:00
2013-04-05 04:07:13 -07:00
raw , err := l . fingerprintToMetrics . Get ( coding . NewProtocolBuffer ( model . FingerprintToDTO ( f ) ) )
2012-12-25 04:50:36 -08:00
if err != nil {
return
2012-12-09 07:27:12 -08:00
}
2012-12-25 04:50:36 -08:00
unmarshaled := & dto . Metric { }
err = proto . Unmarshal ( raw , unmarshaled )
if err != nil {
return
}
2013-02-08 09:03:26 -08:00
metric := model . Metric { }
2013-02-14 08:43:02 -08:00
2012-12-25 04:50:36 -08:00
for _ , v := range unmarshaled . LabelPair {
2013-02-08 09:03:26 -08:00
metric [ model . LabelName ( * v . Name ) ] = model . LabelValue ( * v . Value )
2012-12-25 04:50:36 -08:00
}
2012-12-12 03:53:34 -08:00
2013-02-08 09:03:26 -08:00
// Explicit address passing here shaves immense amounts of time off of the
// code flow due to less tight-loop dereferencing.
m = & metric
2012-12-25 04:50:36 -08:00
return
2012-12-12 03:53:34 -08:00
}
2013-04-18 16:00:57 -07:00
func ( l LevelDBMetricPersistence ) GetValueAtTime ( f model . Fingerprint , t time . Time ) ( samples model . Values ) {
2013-04-18 07:10:52 -07:00
panic ( "Not implemented" )
2012-12-12 03:53:34 -08:00
}
2013-04-18 16:00:57 -07:00
func ( l LevelDBMetricPersistence ) GetBoundaryValues ( f model . Fingerprint , i model . Interval ) ( first model . Values , second model . Values ) {
2013-04-18 07:10:52 -07:00
panic ( "Not implemented" )
2012-12-19 11:34:54 -08:00
}
2013-04-18 16:00:57 -07:00
func ( l * LevelDBMetricPersistence ) GetRangeValues ( f model . Fingerprint , i model . Interval ) ( samples model . Values ) {
2013-04-18 07:10:52 -07:00
panic ( "Not implemented" )
2012-12-12 03:53:34 -08:00
}
2013-02-06 08:06:39 -08:00
type MetricKeyDecoder struct { }
func ( d * MetricKeyDecoder ) DecodeKey ( in interface { } ) ( out interface { } , err error ) {
2013-03-26 06:46:02 -07:00
unmarshaled := dto . LabelPair { }
err = proto . Unmarshal ( in . ( [ ] byte ) , & unmarshaled )
2013-02-06 08:06:39 -08:00
if err != nil {
return
}
2013-02-08 09:03:26 -08:00
2013-03-26 06:46:02 -07:00
out = model . LabelPair {
Name : model . LabelName ( * unmarshaled . Name ) ,
Value : model . LabelValue ( * unmarshaled . Value ) ,
}
2013-02-08 09:03:26 -08:00
return
2013-02-06 08:06:39 -08:00
}
func ( d * MetricKeyDecoder ) DecodeValue ( in interface { } ) ( out interface { } , err error ) {
return
}
2013-03-26 03:45:56 -07:00
type LabelNameFilter struct {
labelName model . LabelName
}
2013-02-06 08:06:39 -08:00
2013-03-26 06:46:02 -07:00
func ( f LabelNameFilter ) Filter ( key , value interface { } ) ( filterResult storage . FilterResult ) {
labelPair , ok := key . ( model . LabelPair )
if ok && labelPair . Name == f . labelName {
2013-02-07 02:38:01 -08:00
return storage . ACCEPT
}
return storage . SKIP
2013-02-06 08:06:39 -08:00
}
2013-03-26 03:45:56 -07:00
type CollectLabelValuesOp struct {
labelValues [ ] model . LabelValue
2013-02-06 08:06:39 -08:00
}
2013-03-26 03:45:56 -07:00
func ( op * CollectLabelValuesOp ) Operate ( key , value interface { } ) ( err * storage . OperatorError ) {
2013-03-26 06:46:02 -07:00
labelPair := key . ( model . LabelPair )
op . labelValues = append ( op . labelValues , model . LabelValue ( labelPair . Value ) )
2013-02-06 08:06:39 -08:00
return
}
2013-03-26 03:45:56 -07:00
func ( l * LevelDBMetricPersistence ) GetAllValuesForLabel ( labelName model . LabelName ) ( values model . LabelValues , err error ) {
filter := & LabelNameFilter {
labelName : labelName ,
}
labelValuesOp := & CollectLabelValuesOp { }
2013-02-06 08:06:39 -08:00
2013-03-26 03:45:56 -07:00
_ , err = l . labelSetToFingerprints . ForEach ( & MetricKeyDecoder { } , filter , labelValuesOp )
2013-02-06 08:06:39 -08:00
if err != nil {
return
}
2013-03-26 03:45:56 -07:00
values = labelValuesOp . labelValues
2013-02-06 08:06:39 -08:00
return
}
2013-02-08 09:03:26 -08:00
func ( l * LevelDBMetricPersistence ) ForEachSample ( builder IteratorsForFingerprintBuilder ) ( err error ) {
panic ( "not implemented" )
}
2013-05-10 07:41:02 -07:00
// CompactKeyspace compacts each database's keyspace serially. An error may
// be returned if there are difficulties with the underlying database or if
// it's empty.
//
// Beware that it would probably be imprudent to run this on a live user-facing
// server due to latency implications.
func ( l * LevelDBMetricPersistence ) CompactKeyspaces ( ) error {
if err := l . CurationRemarks . CompactKeyspace ( ) ; err != nil {
return fmt . Errorf ( "Could not compact curation remarks: %s" , err )
}
if err := l . fingerprintToMetrics . CompactKeyspace ( ) ; err != nil {
return fmt . Errorf ( "Could not compact fingerprint to metric index: %s" , err )
}
if err := l . labelNameToFingerprints . CompactKeyspace ( ) ; err != nil {
return fmt . Errorf ( "Could not compact label name to fingerprint index: %s" , err )
}
if err := l . labelSetToFingerprints . CompactKeyspace ( ) ; err != nil {
return fmt . Errorf ( "Could not compact label pair to fingerprint index: %s" , err )
}
if err := l . MetricHighWatermarks . CompactKeyspace ( ) ; err != nil {
return fmt . Errorf ( "Could not compact metric high watermarks: %s" , err )
}
if err := l . metricMembershipIndex . CompactKeyspace ( ) ; err != nil {
return fmt . Errorf ( "Could not compact metric membership index: %s" , err )
}
if err := l . MetricSamples . CompactKeyspace ( ) ; err != nil {
return fmt . Errorf ( "Could not compact metric samples database: %s" , err )
}
return nil
}