prometheus/wal/wal_test.go

// Copyright 2017 The Prometheus Authors

// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

package wal

import (
	"bytes"
	"encoding/binary"
	"hash/crc32"
	"io/ioutil"
	"math/rand"
	"os"
	"testing"

	"github.com/pkg/errors"
	"github.com/prometheus/tsdb/testutil"
)

// encodedRecord serializes payload b as a single fragment of type t, the way
// the tests expect to find it in a WAL stream.
//
// A page terminator is emitted as one zero byte followed by b. Every other
// type gets a header of recordHeaderSize bytes: the type byte at offset 0, the
// payload length as big-endian uint16 at offset 1 and the CRC32 of the payload
// (castagnoliTable) as big-endian uint32 at offset 3, followed by b itself.
func encodedRecord(t recType, b []byte) []byte {
	switch t {
	case recPageTerm:
		out := make([]byte, 1, 1+len(b))
		return append(out, b...)
	default:
		out := make([]byte, recordHeaderSize, recordHeaderSize+len(b))
		out[0] = byte(t)
		binary.BigEndian.PutUint16(out[1:], uint16(len(b)))

		sum := crc32.Checksum(b, castagnoliTable)
		binary.BigEndian.PutUint32(out[3:], sum)

		return append(out, b...)
	}
}

// TestReader feeds the reader a stream of encoded records with different types.
//
// Every case lists fragments that are encoded back-to-back into one buffer and
// read through NewReader. exp holds the payloads Record() must return, in
// order, and fail states whether the reader has to end with an error. For
// cases that must not fail, the number of records read has to match exp
// exactly.
func TestReader(t *testing.T) {
	data := make([]byte, 100000)
	_, err := rand.Read(data)
	testutil.Ok(t, err)

	type record struct {
		t recType
		b []byte
	}
	cases := []struct {
		t    []record
		exp  [][]byte
		fail bool
	}{
		// Sequence of valid records.
		{
			t: []record{
				{recFull, data[0:200]},
				{recFirst, data[200:300]},
				{recLast, data[300:400]},
				{recFirst, data[400:800]},
				{recMiddle, data[800:900]},
				{recPageTerm, make([]byte, pageSize-900-recordHeaderSize*5-1)}, // exactly lines up with page boundary.
				{recLast, data[900:900]},
				{recFirst, data[900:1000]},
				{recMiddle, data[1000:1200]},
				{recMiddle, data[1200:30000]},
				{recMiddle, data[30000:30001]},
				{recMiddle, data[30001:30001]},
				{recLast, data[30001:32000]},
			},
			exp: [][]byte{
				data[0:200],
				data[200:400],
				data[400:900],
				data[900:32000],
			},
		},
		// Exactly at the limit of one page minus the header size
		{
			t: []record{
				{recFull, data[0 : pageSize-recordHeaderSize]},
			},
			exp: [][]byte{
				data[:pageSize-recordHeaderSize],
			},
		},
		// More than a full page, this exceeds our buffer and can never happen
		// when written by the WAL.
		{
			t: []record{
				{recFull, data[0 : pageSize+1]},
			},
			fail: true,
		},
		// Invalid orders of record types.
		{
			t:    []record{{recMiddle, data[:200]}},
			fail: true,
		},
		{
			t:    []record{{recLast, data[:200]}},
			fail: true,
		},
		{
			t: []record{
				{recFirst, data[:200]},
				{recFull, data[200:400]},
			},
			fail: true,
		},
		{
			t: []record{
				{recFirst, data[:100]},
				{recMiddle, data[100:200]},
				{recFull, data[200:400]},
			},
			fail: true,
		},
		// Non-zero data after page termination.
		{
			t: []record{
				{recFull, data[:100]},
				{recPageTerm, append(make([]byte, 1000), 1)},
			},
			exp:  [][]byte{data[:100]},
			fail: true,
		},
	}
	for i, c := range cases {
		t.Logf("test %d", i)

		var buf []byte
		for _, r := range c.t {
			buf = append(buf, encodedRecord(r.t, r.b)...)
		}
		r := NewReader(bytes.NewReader(buf))

		read := 0
		for ; r.Next(); read++ {
			t.Logf("record %d", read)
			rec := r.Record()

			if read >= len(c.exp) {
				t.Fatal("received more records than inserted")
			}
			testutil.Equals(t, c.exp[read], rec, "Bytes within record did not match expected Bytes")
		}
		if !c.fail && r.Err() != nil {
			t.Fatalf("unexpected error: %s", r.Err())
		}
		if c.fail && r.Err() == nil {
			t.Fatalf("expected error but got none")
		}
		// Without this check a reader that stops early but reports no
		// error would pass a valid case unnoticed.
		if !c.fail && read != len(c.exp) {
			t.Fatalf("read %d records, expected %d", read, len(c.exp))
		}
	}
}

// TestWAL_FuzzWriteRead logs count random records of mixed sizes to a WAL in
// randomly sized batches, then reads all segments back and checks that every
// record comes out unchanged, in order, and that none is missing.
func TestWAL_FuzzWriteRead(t *testing.T) {
	const count = 25000

	dir, err := ioutil.TempDir("", "walfuzz")
	testutil.Ok(t, err)
	defer os.RemoveAll(dir)

	w, err := NewSize(nil, nil, dir, 128*pageSize)
	testutil.Ok(t, err)
	// Release the WAL's resources before the directory is removed; deferred
	// calls run in reverse order, so this happens ahead of RemoveAll.
	defer w.Close()

	input := make([][]byte, 0, count)
	var recs [][]byte

	for i := 0; i < count; i++ {
		// Upper bound (exclusive) for the record length: mostly tiny and
		// sub-page records, with every fifth one allowed to span pages.
		var sz int
		switch i % 5 {
		case 0, 1:
			sz = 50
		case 2, 3:
			sz = pageSize
		default:
			sz = 8 * pageSize
		}
		rec := make([]byte, rand.Intn(sz))
		_, err := rand.Read(rec)
		testutil.Ok(t, err)

		input = append(input, rec)
		recs = append(recs, rec)

		// Randomly batch up records.
		if rand.Intn(4) < 3 {
			testutil.Ok(t, w.Log(recs...))
			recs = recs[:0]
		}
	}
	// Log whatever is left in the last, still pending batch.
	testutil.Ok(t, w.Log(recs...))

	m, n, err := w.Segments()
	testutil.Ok(t, err)

	rc, err := NewSegmentsRangeReader(SegmentRange{Dir: dir, First: m, Last: n})
	testutil.Ok(t, err)
	defer rc.Close()

	rdr := NewReader(rc)

	read := 0
	for ; rdr.Next(); read++ {
		rec := rdr.Record()
		if read >= len(input) {
			t.Fatal("read too many records")
		}
		if !bytes.Equal(input[read], rec) {
			t.Fatalf("record %d (len %d) does not match (expected len %d)",
				read, len(rec), len(input[read]))
		}
	}
	testutil.Ok(t, rdr.Err())
	// A reader that stops early without an error must not go unnoticed.
	testutil.Equals(t, len(input), read, "Wrong number of records read back")
}

// TestWAL_Repair writes a WAL, corrupts one of its segment files in a specific
// way and checks that Repair leaves a WAL that reads without error and holds
// exactly the expected number of leading, unmodified records.
//
// Each table entry names the segment to corrupt, a function that applies the
// corruption to the opened segment file, and the number of records expected
// to survive the repair.
func TestWAL_Repair(t *testing.T) {

	for name, test := range map[string]struct {
		corrSgm    int                            // Which segment to corrupt.
		corrFunc   func(t *testing.T, f *os.File) // Func that applies the corruption.
		intactRecs int                            // Total expected records left after the repair.
	}{
		"torn_last_record": {
			2,
			func(t *testing.T, f *os.File) {
				_, err := f.Seek(pageSize*2, 0)
				testutil.Ok(t, err)
				_, err = f.Write([]byte{byte(recFirst)})
				testutil.Ok(t, err)
			},
			8,
		},
		// Ensures that the page buffer is big enough to fit
		// an entire page size without panicking.
		// https://github.com/prometheus/tsdb/pull/414
		"bad_header": {
			1,
			func(t *testing.T, f *os.File) {
				_, err := f.Seek(pageSize, 0)
				testutil.Ok(t, err)
				_, err = f.Write([]byte{byte(recPageTerm)})
				testutil.Ok(t, err)
			},
			4,
		},
		"bad_fragment_sequence": {
			1,
			func(t *testing.T, f *os.File) {
				_, err := f.Seek(pageSize, 0)
				testutil.Ok(t, err)
				_, err = f.Write([]byte{byte(recLast)})
				testutil.Ok(t, err)
			},
			4,
		},
		"bad_fragment_flag": {
			1,
			func(t *testing.T, f *os.File) {
				_, err := f.Seek(pageSize, 0)
				testutil.Ok(t, err)
				_, err = f.Write([]byte{123})
				testutil.Ok(t, err)
			},
			4,
		},
		"bad_checksum": {
			1,
			func(t *testing.T, f *os.File) {
				_, err := f.Seek(pageSize+4, 0)
				testutil.Ok(t, err)
				_, err = f.Write([]byte{0})
				testutil.Ok(t, err)
			},
			4,
		},
		"bad_length": {
			1,
			func(t *testing.T, f *os.File) {
				_, err := f.Seek(pageSize+2, 0)
				testutil.Ok(t, err)
				_, err = f.Write([]byte{0})
				testutil.Ok(t, err)
			},
			4,
		},
		"bad_content": {
			1,
			func(t *testing.T, f *os.File) {
				_, err := f.Seek(pageSize+100, 0)
				testutil.Ok(t, err)
				_, err = f.Write([]byte("beef"))
				testutil.Ok(t, err)
			},
			4,
		},
	} {
		t.Run(name, func(t *testing.T) {
			dir, err := ioutil.TempDir("", "wal_repair")
			testutil.Ok(t, err)
			defer os.RemoveAll(dir)

			// We create 3 segments with 3 records each and
			// then corrupt a given record in a given segment.
			// As a result we want a repaired WAL with given intact records.
			w, err := NewSize(nil, nil, dir, 3*pageSize)
			testutil.Ok(t, err)

			var records [][]byte

			for i := 1; i <= 9; i++ {
				// Each record fills one page; the first byte tags it
				// so records can be told apart when compared later.
				b := make([]byte, pageSize-recordHeaderSize)
				b[0] = byte(i)
				records = append(records, b)
				testutil.Ok(t, w.Log(b))
			}
			testutil.Ok(t, w.Close())

			f, err := os.OpenFile(SegmentName(dir, test.corrSgm), os.O_RDWR, 0666)
			testutil.Ok(t, err)

			// Apply corruption function. It gets the subtest's t so that a
			// failure is reported on the test that is actually running.
			test.corrFunc(t, f)

			testutil.Ok(t, f.Close())

			w, err = New(nil, nil, dir)
			testutil.Ok(t, err)
			// Close the reopened WAL before the directory is removed.
			defer w.Close()

			sr, err := NewSegmentsReader(dir)
			testutil.Ok(t, err)
			r := NewReader(sr)

			// Drain the reader; only the resulting error is of interest.
			for r.Next() {
			}
			testutil.NotOk(t, r.Err())
			testutil.Ok(t, sr.Close())
			testutil.Ok(t, w.Repair(r.Err()))

			// See https://github.com/prometheus/prometheus/issues/4603
			// We need to close w.segment because it needs to be deleted.
			// But this is to mainly artificially test Repair() again.
			testutil.Ok(t, w.segment.Close())
			testutil.Ok(t, w.Repair(errors.Wrap(r.Err(), "err")))

			sr, err = NewSegmentsReader(dir)
			testutil.Ok(t, err)
			defer sr.Close()
			r = NewReader(sr)

			var result [][]byte
			for r.Next() {
				// Copy the record; the loop keeps it beyond the next
				// call to Next.
				var b []byte
				result = append(result, append(b, r.Record()...))
			}
			testutil.Ok(t, r.Err())
			testutil.Equals(t, test.intactRecs, len(result), "Wrong number of intact records")

			for i, got := range result {
				if !bytes.Equal(records[i], got) {
					t.Fatalf("record %d diverges: want %x, got %x", i, records[i][:10], got[:10])
				}
			}
		})
	}
}

// BenchmarkWAL_LogBatched measures Log throughput when 2048-byte records are
// handed to the WAL in batches of 1000 records per call.
func BenchmarkWAL_LogBatched(b *testing.B) {
	dir, err := ioutil.TempDir("", "bench_logbatch")
	testutil.Ok(b, err)
	defer os.RemoveAll(dir)

	// Write into the temporary directory so that the benchmark leaves no
	// files behind in the working directory.
	w, err := New(nil, nil, dir)
	testutil.Ok(b, err)
	defer w.Close()

	const batchSize = 1000

	var buf [2048]byte
	recs := make([][]byte, 0, batchSize)
	b.SetBytes(2048)
	// Keep directory and WAL setup out of the measurement.
	b.ResetTimer()

	for i := 0; i < b.N; i++ {
		recs = append(recs, buf[:])
		if len(recs) < batchSize {
			continue
		}
		err := w.Log(recs...)
		testutil.Ok(b, err)
		recs = recs[:0]
	}
	// Log the trailing partial batch as well; SetBytes accounts for every
	// iteration, so each record has to actually be written.
	if len(recs) > 0 {
		testutil.Ok(b, w.Log(recs...))
	}
	// Stop timer to not count fsync time on close.
	// If it's counted batched vs. single benchmarks are very similar but
	// do not show burst throughput well.
	b.StopTimer()
}

// BenchmarkWAL_Log measures Log throughput when 2048-byte records are written
// one record per call.
func BenchmarkWAL_Log(b *testing.B) {
	dir, err := ioutil.TempDir("", "bench_logsingle")
	testutil.Ok(b, err)
	defer os.RemoveAll(dir)

	// Write into the temporary directory so that the benchmark leaves no
	// files behind in the working directory.
	w, err := New(nil, nil, dir)
	testutil.Ok(b, err)
	defer w.Close()

	var buf [2048]byte
	b.SetBytes(2048)
	// Keep directory and WAL setup out of the measurement.
	b.ResetTimer()

	for i := 0; i < b.N; i++ {
		err := w.Log(buf[:])
		testutil.Ok(b, err)
	}
	// Stop timer to not count fsync time on close.
	// If it's counted batched vs. single benchmarks are very similar but
	// do not show burst throughput well.
	b.StopTimer()
}
wal: add write ahead log package This adds a new WAL that's agnostic to the actual record contents. It's much simpler and should be more resilient than the existing one. Signed-off-by: Fabian Reinartz <freinartz@google.com> 2018-05-16 05:02:55 -07:00			`// Copyright 2017 The Prometheus Authors`

			`// Licensed under the Apache License, Version 2.0 (the "License");`
			`// you may not use this file except in compliance with the License.`
			`// You may obtain a copy of the License at`
			`//`
			`// http://www.apache.org/licenses/LICENSE-2.0`
			`//`
			`// Unless required by applicable law or agreed to in writing, software`
			`// distributed under the License is distributed on an "AS IS" BASIS,`
			`// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.`
			`// See the License for the specific language governing permissions and`
			`// limitations under the License.`

			`package wal`

			`import (`
			`"bytes"`
			`"encoding/binary"`
			`"hash/crc32"`
			`"io/ioutil"`
			`"math/rand"`
			`"os"`
			`"testing"`

Make sure WAL Repair can handle wrapped errors Signed-off-by: Goutham Veeramachaneni <gouthamve@gmail.com> 2018-09-18 23:10:07 -07:00			`"github.com/pkg/errors"`
wal: add write ahead log package This adds a new WAL that's agnostic to the actual record contents. It's much simpler and should be more resilient than the existing one. Signed-off-by: Fabian Reinartz <freinartz@google.com> 2018-05-16 05:02:55 -07:00			`"github.com/prometheus/tsdb/testutil"`
			`)`

			`func encodedRecord(t recType, b []byte) []byte {`
			`if t == recPageTerm {`
			`return append([]byte{0}, b...)`
			`}`
			`r := make([]byte, recordHeaderSize)`
			`r[0] = byte(t)`
			`binary.BigEndian.PutUint16(r[1:], uint16(len(b)))`
			`binary.BigEndian.PutUint32(r[3:], crc32.Checksum(b, castagnoliTable))`
			`return append(r, b...)`
			`}`

			`// TestReader feeds the reader a stream of encoded records with different types.`
			`func TestReader(t *testing.T) {`
			`data := make([]byte, 100000)`
			`_, err := rand.Read(data)`
			`testutil.Ok(t, err)`

			`type record struct {`
			`t recType`
			`b []byte`
			`}`
			`cases := []struct {`
			`t []record`
			`exp [][]byte`
			`fail bool`
			`}{`
			`// Sequence of valid records.`
			`{`
			`t: []record{`
			`{recFull, data[0:200]},`
			`{recFirst, data[200:300]},`
			`{recLast, data[300:400]},`
			`{recFirst, data[400:800]},`
			`{recMiddle, data[800:900]},`
			`{recPageTerm, make([]byte, pageSize-900-recordHeaderSize*5-1)}, // exactly lines up with page boundary.`
			`{recLast, data[900:900]},`
			`{recFirst, data[900:1000]},`
			`{recMiddle, data[1000:1200]},`
			`{recMiddle, data[1200:30000]},`
			`{recMiddle, data[30000:30001]},`
			`{recMiddle, data[30001:30001]},`
			`{recLast, data[30001:32000]},`
			`},`
			`exp: [][]byte{`
			`data[0:200],`
			`data[200:400],`
			`data[400:900],`
			`data[900:32000],`
			`},`
			`},`
			`// Exactly at the limit of one page minus the header size`
			`{`
			`t: []record{`
			`{recFull, data[0 : pageSize-recordHeaderSize]},`
			`},`
			`exp: [][]byte{`
			`data[:pageSize-recordHeaderSize],`
			`},`
			`},`
			`// More than a full page, this exceeds our buffer and can never happen`
			`// when written by the WAL.`
			`{`
			`t: []record{`
			`{recFull, data[0 : pageSize+1]},`
			`},`
			`fail: true,`
			`},`
			`// Invalid orders of record types.`
			`{`
			`t: []record{{recMiddle, data[:200]}},`
			`fail: true,`
			`},`
			`{`
			`t: []record{{recLast, data[:200]}},`
			`fail: true,`
			`},`
			`{`
			`t: []record{`
			`{recFirst, data[:200]},`
			`{recFull, data[200:400]},`
			`},`
			`fail: true,`
			`},`
			`{`
			`t: []record{`
			`{recFirst, data[:100]},`
			`{recMiddle, data[100:200]},`
			`{recFull, data[200:400]},`
			`},`
			`fail: true,`
			`},`
			`// Non-zero data after page termination.`
			`{`
			`t: []record{`
			`{recFull, data[:100]},`
			`{recPageTerm, append(make([]byte, 1000), 1)},`
			`},`
			`exp: [][]byte{data[:100]},`
			`fail: true,`
			`},`
			`}`
			`for i, c := range cases {`
			`t.Logf("test %d", i)`

			`var buf []byte`
			`for _, r := range c.t {`
			`buf = append(buf, encodedRecord(r.t, r.b)...)`
			`}`
			`r := NewReader(bytes.NewReader(buf))`

			`for j := 0; r.Next(); j++ {`
			`t.Logf("record %d", j)`
			`rec := r.Record()`

			`if j >= len(c.exp) {`
			`t.Fatal("received more records than inserted")`
			`}`
Add msg parameter to Equals function in testutil (#398) * Add msg parameter to Equals function in testutil Co-authored-by: Chris Marchbanks <csmarchbanks@gmail.com> Signed-off-by: Camille Janicki <camille.janicki@gmail.com> 2018-10-03 01:08:31 -07:00			`testutil.Equals(t, c.exp[j], rec, "Bytes within record did not match expected Bytes")`
wal: add write ahead log package This adds a new WAL that's agnostic to the actual record contents. It's much simpler and should be more resilient than the existing one. Signed-off-by: Fabian Reinartz <freinartz@google.com> 2018-05-16 05:02:55 -07:00			`}`
			`if !c.fail && r.Err() != nil {`
			`t.Fatalf("unexpected error: %s", r.Err())`
			`}`
			`if c.fail && r.Err() == nil {`
			`t.Fatalf("expected error but got none")`
			`}`
			`}`
			`}`

			`func TestWAL_FuzzWriteRead(t *testing.T) {`
			`const count = 25000`

			`dir, err := ioutil.TempDir("", "walfuzz")`
			`testutil.Ok(t, err)`
			`defer os.RemoveAll(dir)`

wal: add segment type and repair procedure Allow to repair the WAL based on the error returned by a reader during a full scan over all records. Signed-off-by: Fabian Reinartz <freinartz@google.com> 2018-05-17 06:00:32 -07:00			`w, err := NewSize(nil, nil, dir, 128*pageSize)`
wal: add write ahead log package This adds a new WAL that's agnostic to the actual record contents. It's much simpler and should be more resilient than the existing one. Signed-off-by: Fabian Reinartz <freinartz@google.com> 2018-05-16 05:02:55 -07:00			`testutil.Ok(t, err)`

			`var input [][]byte`
			`var recs [][]byte`

			`for i := 0; i < count; i++ {`
			`var sz int`
			`switch i % 5 {`
			`case 0, 1:`
			`sz = 50`
			`case 2, 3:`
			`sz = pageSize`
			`default:`
			`sz = 8 * pageSize`
			`}`
			`rec := make([]byte, rand.Intn(sz))`
			`_, err := rand.Read(rec)`
			`testutil.Ok(t, err)`

			`input = append(input, rec)`
			`recs = append(recs, rec)`

			`// Randomly batch up records.`
			`if rand.Intn(4) < 3 {`
			`testutil.Ok(t, w.Log(recs...))`
			`recs = recs[:0]`
			`}`
			`}`
			`testutil.Ok(t, w.Log(recs...))`

			`m, n, err := w.Segments()`
			`testutil.Ok(t, err)`

refactor NewSegmentsRangeReader to take multi WAL ranges (#449) * refactor NewSegmentsRangeReader to take multi WAL ranges In case of an error when checkpointing the WAL the error doesn't show the exact WAL index that is corrupter. this is because it uses MultiReader to read multiply WAL files. This refactoring allows the NewSegmentsRangeReader to take more than a single WAL range and it reads all of the ranges by iterating each one. this changes the logs from create checkpoint: read segments: corruption after 4841144384 bytes:... to create checkpoint: read segments: corruption in segment data/wal/00017351 at 123142208: ... Signed-off-by: Krasi Georgiev <kgeorgie@redhat.com> 2018-11-30 06:46:16 -08:00			`rc, err := NewSegmentsRangeReader(SegmentRange{Dir: dir, First: m, Last: n})`
wal: add write ahead log package This adds a new WAL that's agnostic to the actual record contents. It's much simpler and should be more resilient than the existing one. Signed-off-by: Fabian Reinartz <freinartz@google.com> 2018-05-16 05:02:55 -07:00			`testutil.Ok(t, err)`
			`defer rc.Close()`

			`rdr := NewReader(rc)`

			`for i := 0; rdr.Next(); i++ {`
			`rec := rdr.Record()`
			`if i >= len(input) {`
			`t.Fatal("read too many records")`
			`}`
			`if !bytes.Equal(input[i], rec) {`
			`t.Fatalf("record %d (len %d) does not match (expected len %d)",`
			`i, len(rec), len(input[i]))`
			`}`
			`}`
			`testutil.Ok(t, rdr.Err())`
			`}`

wal: add segment type and repair procedure Allow to repair the WAL based on the error returned by a reader during a full scan over all records. Signed-off-by: Fabian Reinartz <freinartz@google.com> 2018-05-17 06:00:32 -07:00			`func TestWAL_Repair(t *testing.T) {`
return an error when the last wal segment record is torn. (#451) * return an error when the last wal segment record is torn. this ensures that a repair will be run when the last record in a segment is torn. Signed-off-by: Krasi Georgiev <kgeorgie@redhat.com> 2018-11-28 05:15:11 -08:00
			`for name, test := range map[string]struct {`
			`corrSgm int // Which segment to corrupt.`
			`corrFunc func(f *os.File) // Func that applies the corruption.`
			`intactRecs int // Total expected records left after the repair.`
			`}{`
			`"torn_last_record": {`
			`2,`
			`func(f *os.File) {`
			`_, err := f.Seek(pageSize*2, 0)`
			`testutil.Ok(t, err)`
			`_, err = f.Write([]byte{byte(recFirst)})`
			`testutil.Ok(t, err)`
			`},`
			`8,`
			`},`
			`// Ensures that the page buffer is big enough to fit`
			`// an entire page size without panicing.`
buffer-panic when reading a record after recPageTerm (#429) Signed-off-by: Krasi Georgiev <kgeorgie@redhat.com> 2018-11-14 08:43:33 -08:00			`// https://github.com/prometheus/tsdb/pull/414`
return an error when the last wal segment record is torn. (#451) * return an error when the last wal segment record is torn. this ensures that a repair will be run when the last record in a segment is torn. Signed-off-by: Krasi Georgiev <kgeorgie@redhat.com> 2018-11-28 05:15:11 -08:00			`"bad_header": {`
			`1,`
			`func(f *os.File) {`
			`_, err := f.Seek(pageSize, 0)`
			`testutil.Ok(t, err)`
			`_, err = f.Write([]byte{byte(recPageTerm)})`
			`testutil.Ok(t, err)`
			`},`
			`4,`
buffer-panic when reading a record after recPageTerm (#429) Signed-off-by: Krasi Georgiev <kgeorgie@redhat.com> 2018-11-14 08:43:33 -08:00			`},`
return an error when the last wal segment record is torn. (#451) * return an error when the last wal segment record is torn. this ensures that a repair will be run when the last record in a segment is torn. Signed-off-by: Krasi Georgiev <kgeorgie@redhat.com> 2018-11-28 05:15:11 -08:00			`"bad_fragment_sequence": {`
			`1,`
			`func(f *os.File) {`
			`_, err := f.Seek(pageSize, 0)`
			`testutil.Ok(t, err)`
			`_, err = f.Write([]byte{byte(recLast)})`
			`testutil.Ok(t, err)`
			`},`
			`4,`
wal: add segment type and repair procedure Allow to repair the WAL based on the error returned by a reader during a full scan over all records. Signed-off-by: Fabian Reinartz <freinartz@google.com> 2018-05-17 06:00:32 -07:00			`},`
return an error when the last wal segment record is torn. (#451) * return an error when the last wal segment record is torn. this ensures that a repair will be run when the last record in a segment is torn. Signed-off-by: Krasi Georgiev <kgeorgie@redhat.com> 2018-11-28 05:15:11 -08:00			`"bad_fragment_flag": {`
			`1,`
			`func(f *os.File) {`
			`_, err := f.Seek(pageSize, 0)`
			`testutil.Ok(t, err)`
			`_, err = f.Write([]byte{123})`
			`testutil.Ok(t, err)`
			`},`
			`4,`
wal: add segment type and repair procedure Allow to repair the WAL based on the error returned by a reader during a full scan over all records. Signed-off-by: Fabian Reinartz <freinartz@google.com> 2018-05-17 06:00:32 -07:00			`},`
return an error when the last wal segment record is torn. (#451) * return an error when the last wal segment record is torn. this ensures that a repair will be run when the last record in a segment is torn. Signed-off-by: Krasi Georgiev <kgeorgie@redhat.com> 2018-11-28 05:15:11 -08:00			`"bad_checksum": {`
			`1,`
			`func(f *os.File) {`
			`_, err := f.Seek(pageSize+4, 0)`
			`testutil.Ok(t, err)`
			`_, err = f.Write([]byte{0})`
			`testutil.Ok(t, err)`
			`},`
			`4,`
wal: add segment type and repair procedure Allow to repair the WAL based on the error returned by a reader during a full scan over all records. Signed-off-by: Fabian Reinartz <freinartz@google.com> 2018-05-17 06:00:32 -07:00			`},`
return an error when the last wal segment record is torn. (#451) * return an error when the last wal segment record is torn. this ensures that a repair will be run when the last record in a segment is torn. Signed-off-by: Krasi Georgiev <kgeorgie@redhat.com> 2018-11-28 05:15:11 -08:00			`"bad_length": {`
			`1,`
			`func(f *os.File) {`
			`_, err := f.Seek(pageSize+2, 0)`
			`testutil.Ok(t, err)`
			`_, err = f.Write([]byte{0})`
			`testutil.Ok(t, err)`
			`},`
			`4,`
wal: add segment type and repair procedure Allow to repair the WAL based on the error returned by a reader during a full scan over all records. Signed-off-by: Fabian Reinartz <freinartz@google.com> 2018-05-17 06:00:32 -07:00			`},`
return an error when the last wal segment record is torn. (#451) * return an error when the last wal segment record is torn. this ensures that a repair will be run when the last record in a segment is torn. Signed-off-by: Krasi Georgiev <kgeorgie@redhat.com> 2018-11-28 05:15:11 -08:00			`"bad_content": {`
			`1,`
			`func(f *os.File) {`
			`_, err := f.Seek(pageSize+100, 0)`
			`testutil.Ok(t, err)`
			`_, err = f.Write([]byte("beef"))`
			`testutil.Ok(t, err)`
			`},`
			`4,`
wal: add segment type and repair procedure Allow to repair the WAL based on the error returned by a reader during a full scan over all records. Signed-off-by: Fabian Reinartz <freinartz@google.com> 2018-05-17 06:00:32 -07:00			`},`
			`} {`
			`t.Run(name, func(t *testing.T) {`
			`dir, err := ioutil.TempDir("", "wal_repair")`
			`testutil.Ok(t, err)`
			`defer os.RemoveAll(dir)`

return an error when the last wal segment record is torn. (#451) * return an error when the last wal segment record is torn. this ensures that a repair will be run when the last record in a segment is torn. Signed-off-by: Krasi Georgiev <kgeorgie@redhat.com> 2018-11-28 05:15:11 -08:00			`// We create 3 segments with 3 records each and`
			`// then corrupt a given record in a given segment.`
			`// As a result we want a repaired WAL with given intact records.`
wal: add segment type and repair procedure Allow to repair the WAL based on the error returned by a reader during a full scan over all records. Signed-off-by: Fabian Reinartz <freinartz@google.com> 2018-05-17 06:00:32 -07:00			`w, err := NewSize(nil, nil, dir, 3*pageSize)`
			`testutil.Ok(t, err)`

			`var records [][]byte`

			`for i := 1; i <= 9; i++ {`
			`b := make([]byte, pageSize-recordHeaderSize)`
			`b[0] = byte(i)`
			`records = append(records, b)`
			`testutil.Ok(t, w.Log(b))`
			`}`
			`testutil.Ok(t, w.Close())`

return an error when the last wal segment record is torn. (#451) * return an error when the last wal segment record is torn. this ensures that a repair will be run when the last record in a segment is torn. Signed-off-by: Krasi Georgiev <kgeorgie@redhat.com> 2018-11-28 05:15:11 -08:00			`f, err := os.OpenFile(SegmentName(dir, test.corrSgm), os.O_RDWR, 0666)`
wal: add segment type and repair procedure Allow to repair the WAL based on the error returned by a reader during a full scan over all records. Signed-off-by: Fabian Reinartz <freinartz@google.com> 2018-05-17 06:00:32 -07:00			`testutil.Ok(t, err)`

			`// Apply corruption function.`
return an error when the last wal segment record is torn. (#451) * return an error when the last wal segment record is torn. this ensures that a repair will be run when the last record in a segment is torn. Signed-off-by: Krasi Georgiev <kgeorgie@redhat.com> 2018-11-28 05:15:11 -08:00			`test.corrFunc(f)`
wal: add segment type and repair procedure Allow to repair the WAL based on the error returned by a reader during a full scan over all records. Signed-off-by: Fabian Reinartz <freinartz@google.com> 2018-05-17 06:00:32 -07:00
			`testutil.Ok(t, f.Close())`

			`w, err = New(nil, nil, dir)`
			`testutil.Ok(t, err)`

			`sr, err := NewSegmentsReader(dir)`
			`testutil.Ok(t, err)`
			`r := NewReader(sr)`

			`for r.Next() {`
			`}`
			`testutil.NotOk(t, r.Err())`
Fix filehandling for windows (#392) * Fix filehandling for windows Signed-off-by: Goutham Veeramachaneni <gouthamve@gmail.com> * Fix more windows filehandling issues Windows: Close files before deleting Checkpoints. Signed-off-by: Goutham Veeramachaneni <gouthamve@gmail.com> Windows: Close writers in case of errors so they can be deleted Signed-off-by: Goutham Veeramachaneni <gouthamve@gmail.com> Windows: Close block so that it can be deleted. Signed-off-by: Goutham Veeramachaneni <gouthamve@gmail.com> Windows: Close file to delete it Signed-off-by: Goutham Veeramachaneni <gouthamve@gmail.com> Windows: Close dir so that it can be deleted. Signed-off-by: Goutham Veeramachaneni <gouthamve@gmail.com> Windows: close files so that they can be deleted. Signed-off-by: Goutham Veeramachaneni <gouthamve@gmail.com> * Review feedback Signed-off-by: Goutham Veeramachaneni <gouthamve@gmail.com> 2018-09-20 22:31:22 -07:00			`testutil.Ok(t, sr.Close())`
wal: add segment type and repair procedure Allow to repair the WAL based on the error returned by a reader during a full scan over all records. Signed-off-by: Fabian Reinartz <freinartz@google.com> 2018-05-17 06:00:32 -07:00			`testutil.Ok(t, w.Repair(r.Err()))`
Fix filehandling for windows (#392) * Fix filehandling for windows Signed-off-by: Goutham Veeramachaneni <gouthamve@gmail.com> * Fix more windows filehandling issues Windows: Close files before deleting Checkpoints. Signed-off-by: Goutham Veeramachaneni <gouthamve@gmail.com> Windows: Close writers in case of errors so they can be deleted Signed-off-by: Goutham Veeramachaneni <gouthamve@gmail.com> Windows: Close block so that it can be deleted. Signed-off-by: Goutham Veeramachaneni <gouthamve@gmail.com> Windows: Close file to delete it Signed-off-by: Goutham Veeramachaneni <gouthamve@gmail.com> Windows: Close dir so that it can be deleted. Signed-off-by: Goutham Veeramachaneni <gouthamve@gmail.com> Windows: close files so that they can be deleted. Signed-off-by: Goutham Veeramachaneni <gouthamve@gmail.com> * Review feedback Signed-off-by: Goutham Veeramachaneni <gouthamve@gmail.com> 2018-09-20 22:31:22 -07:00
			`// See https://github.com/prometheus/prometheus/issues/4603`
			`// We need to close w.segment because it needs to be deleted.`
			`// But this is to mainly artificially test Repair() again.`
			`testutil.Ok(t, w.segment.Close())`
			`testutil.Ok(t, w.Repair(errors.Wrap(r.Err(), "err")))`
wal: add segment type and repair procedure Allow to repair the WAL based on the error returned by a reader during a full scan over all records. Signed-off-by: Fabian Reinartz <freinartz@google.com> 2018-05-17 06:00:32 -07:00
			`sr, err = NewSegmentsReader(dir)`
			`testutil.Ok(t, err)`
			`r = NewReader(sr)`

			`var result [][]byte`
			`for r.Next() {`
			`var b []byte`
			`result = append(result, append(b, r.Record()...))`
			`}`
			`testutil.Ok(t, r.Err())`
return an error when the last wal segment record is torn. (#451) * return an error when the last wal segment record is torn. this ensures that a repair will be run when the last record in a segment is torn. Signed-off-by: Krasi Georgiev <kgeorgie@redhat.com> 2018-11-28 05:15:11 -08:00			`testutil.Equals(t, test.intactRecs, len(result), "Wrong number of intact records")`
wal: add segment type and repair procedure Allow to repair the WAL based on the error returned by a reader during a full scan over all records. Signed-off-by: Fabian Reinartz <freinartz@google.com> 2018-05-17 06:00:32 -07:00
			`for i, r := range result {`
			`if !bytes.Equal(records[i], r) {`
			`t.Fatalf("record %d diverges: want %x, got %x", i, records[i][:10], r[:10])`
			`}`
			`}`
			`})`
			`}`
			`}`

wal: add write ahead log package This adds a new WAL that's agnostic to the actual record contents. It's much simpler and should be more resilient than the existing one. Signed-off-by: Fabian Reinartz <freinartz@google.com> 2018-05-16 05:02:55 -07:00			`func BenchmarkWAL_LogBatched(b *testing.B) {`
			`dir, err := ioutil.TempDir("", "bench_logbatch")`
			`testutil.Ok(b, err)`
			`defer os.RemoveAll(dir)`

			`w, err := New(nil, nil, "testdir")`
			`testutil.Ok(b, err)`
			`defer w.Close()`

			`var buf [2048]byte`
			`var recs [][]byte`
			`b.SetBytes(2048)`

			`for i := 0; i < b.N; i++ {`
			`recs = append(recs, buf[:])`
			`if len(recs) < 1000 {`
			`continue`
			`}`
			`err := w.Log(recs...)`
			`testutil.Ok(b, err)`
			`recs = recs[:0]`
			`}`
			`// Stop timer to not count fsync time on close.`
			`// If it's counted batched vs. single benchmarks are very similar but`
			`// do not show burst throughput well.`
			`b.StopTimer()`
			`}`

			`func BenchmarkWAL_Log(b *testing.B) {`
			`dir, err := ioutil.TempDir("", "bench_logsingle")`
			`testutil.Ok(b, err)`
			`defer os.RemoveAll(dir)`

			`w, err := New(nil, nil, "testdir")`
			`testutil.Ok(b, err)`
			`defer w.Close()`

			`var buf [2048]byte`
			`b.SetBytes(2048)`

			`for i := 0; i < b.N; i++ {`
			`err := w.Log(buf[:])`
			`testutil.Ok(b, err)`
			`}`
			`// Stop timer to not count fsync time on close.`
			`// If it's counted batched vs. single benchmarks are very similar but`
			`// do not show burst throughput well.`
			`b.StopTimer()`
			`}`