influxdb/tsdb/tsm1/engine_test.go

620 lines
17 KiB
Go

package tsm1_test
import (
"context"
"fmt"
"io/ioutil"
"math"
"os"
"path/filepath"
"runtime"
"strings"
"sync"
"testing"
"time"
"github.com/influxdata/influxdb"
"github.com/influxdata/influxdb/logger"
"github.com/influxdata/influxdb/models"
"github.com/influxdata/influxdb/toml"
"github.com/influxdata/influxdb/tsdb"
"github.com/influxdata/influxdb/tsdb/tsi1"
"github.com/influxdata/influxdb/tsdb/tsm1"
"github.com/influxdata/influxql"
"go.uber.org/zap"
)
// Test that series id set gets updated and returned appropriately.
func TestIndex_SeriesIDSet(t *testing.T) {
engine := MustOpenEngine()
defer engine.Close()
// Add some series.
engine.MustAddSeries("cpu", map[string]string{"host": "a", "region": "west"})
engine.MustAddSeries("cpu", map[string]string{"host": "b", "region": "west"})
engine.MustAddSeries("cpu", map[string]string{"host": "b"})
engine.MustAddSeries("gpu", nil)
engine.MustAddSeries("gpu", map[string]string{"host": "b"})
engine.MustAddSeries("mem", map[string]string{"host": "z"})
// Collect series IDs.
seriesIDMap := map[string]tsdb.SeriesID{}
var e tsdb.SeriesIDElem
var err error
itr := engine.sfile.SeriesIDIterator()
for e, err = itr.Next(); ; e, err = itr.Next() {
if err != nil {
t.Fatal(err)
} else if e.SeriesID.IsZero() {
break
}
name, tags := tsdb.ParseSeriesKey(engine.sfile.SeriesKey(e.SeriesID))
key := fmt.Sprintf("%s%s", name, tags.HashKey())
seriesIDMap[key] = e.SeriesID
}
for _, id := range seriesIDMap {
if !engine.SeriesIDSet().Contains(id) {
t.Fatalf("bitmap does not contain ID: %d", id)
}
}
// Drop all the series for the gpu measurement and they should no longer
// be in the series ID set.
if err := engine.DeletePrefixRange(context.Background(), []byte("gpu"), math.MinInt64, math.MaxInt64, nil); err != nil {
t.Fatal(err)
}
if engine.SeriesIDSet().Contains(seriesIDMap["gpu"]) {
t.Fatalf("bitmap does not contain ID: %d for key %s, but should", seriesIDMap["gpu"], "gpu")
} else if engine.SeriesIDSet().Contains(seriesIDMap["gpu,host=b"]) {
t.Fatalf("bitmap does not contain ID: %d for key %s, but should", seriesIDMap["gpu,host=b"], "gpu,host=b")
}
delete(seriesIDMap, "gpu")
delete(seriesIDMap, "gpu,host=b")
// The rest of the keys should still be in the set.
for key, id := range seriesIDMap {
if !engine.SeriesIDSet().Contains(id) {
t.Fatalf("bitmap does not contain ID: %d for key %s, but should", id, key)
}
}
// Reopen the engine, and the series should be re-added to the bitmap.
if err := engine.Reopen(); err != nil {
t.Fatal(err)
}
// Check bitset is expected.
expected := tsdb.NewSeriesIDSet()
for _, id := range seriesIDMap {
expected.Add(id)
}
if !engine.SeriesIDSet().Equals(expected) {
t.Fatalf("got bitset %s, expected %s", engine.SeriesIDSet().String(), expected.String())
}
}
func TestEngine_SnapshotsDisabled(t *testing.T) {
sfile := MustOpenSeriesFile()
defer sfile.Close()
// Generate temporary file.
dir, _ := ioutil.TempDir("", "tsm")
defer os.RemoveAll(dir)
// Create a tsm1 engine.
idx := MustOpenIndex(filepath.Join(dir, "index"), tsdb.NewSeriesIDSet(), sfile.SeriesFile)
defer idx.Close()
config := tsm1.NewConfig()
e := tsm1.NewEngine(filepath.Join(dir, "data"), idx, config,
tsm1.WithCompactionPlanner(newMockPlanner()))
e.SetEnabled(false)
if err := e.Open(context.Background()); err != nil {
t.Fatalf("failed to open tsm1 engine: %s", err.Error())
}
defer e.Close()
// Make sure Snapshots are disabled.
e.SetCompactionsEnabled(false)
e.Compactor.DisableSnapshots()
// Writing a snapshot should not fail when the snapshot is empty
// even if snapshots are disabled.
if err := e.WriteSnapshot(context.Background(), tsm1.CacheStatusColdNoWrites); err != nil {
t.Fatalf("failed to snapshot: %s", err.Error())
}
}
func TestEngine_ShouldCompactCache(t *testing.T) {
nowTime := time.Now()
e, err := NewEngine(tsm1.NewConfig())
if err != nil {
t.Fatal(err)
}
// mock the planner so compactions don't run during the test
e.CompactionPlan = &mockPlanner{}
e.SetEnabled(false)
if err := e.Open(context.Background()); err != nil {
t.Fatalf("failed to open tsm1 engine: %s", err.Error())
}
defer e.Close()
if got, exp := e.ShouldCompactCache(nowTime), tsm1.CacheStatusOkay; got != exp {
t.Fatalf("got status %v, exp status %v - nothing written to cache, so should not compact", got, exp)
}
if err := e.WritePointsString("mm", "m,k=v f=3i"); err != nil {
t.Fatal(err)
}
if got, exp := e.ShouldCompactCache(nowTime), tsm1.CacheStatusOkay; got != exp {
t.Fatalf("got status %v, exp status %v - cache size < flush threshold and nothing written to FileStore, so should not compact", got, exp)
}
if got, exp := e.ShouldCompactCache(nowTime.Add(time.Hour)), tsm1.CacheStatusColdNoWrites; got != exp {
t.Fatalf("got status %v, exp status %v - last compaction was longer than flush write cold threshold, so should compact", got, exp)
}
e.CacheFlushMemorySizeThreshold = 1
if got, exp := e.ShouldCompactCache(nowTime), tsm1.CacheStatusSizeExceeded; got != exp {
t.Fatalf("got status %v, exp status %v - cache size > flush threshold, so should compact", got, exp)
}
e.CacheFlushMemorySizeThreshold = 1024 // Reset.
if got, exp := e.ShouldCompactCache(nowTime), tsm1.CacheStatusOkay; got != exp {
t.Fatalf("got status %v, exp status %v - nothing written to cache, so should not compact", got, exp)
}
e.CacheFlushAgeDurationThreshold = 100 * time.Millisecond
time.Sleep(250 * time.Millisecond)
if got, exp := e.ShouldCompactCache(nowTime), tsm1.CacheStatusAgeExceeded; got != exp {
t.Fatalf("got status %v, exp status %v - cache age > max age threshold, so should compact", got, exp)
}
}
func makeBlockTypeSlice(n int) []byte {
r := make([]byte, n)
b := tsm1.BlockFloat64
m := tsm1.BlockUnsigned + 1
for i := 0; i < len(r); i++ {
r[i] = b % m
}
return r
}
var blockType = influxql.Unknown
func BenchmarkBlockTypeToInfluxQLDataType(b *testing.B) {
t := makeBlockTypeSlice(1000)
for i := 0; i < b.N; i++ {
for j := 0; j < len(t); j++ {
blockType = tsm1.BlockTypeToInfluxQLDataType(t[j])
}
}
}
// This test ensures that "sync: WaitGroup is reused before previous Wait has returned" is
// is not raised.
func TestEngine_DisableEnableCompactions_Concurrent(t *testing.T) {
e := MustOpenEngine()
defer e.Close()
var wg sync.WaitGroup
wg.Add(2)
go func() {
defer wg.Done()
for i := 0; i < 1000; i++ {
e.SetCompactionsEnabled(true)
e.SetCompactionsEnabled(false)
}
}()
go func() {
defer wg.Done()
for i := 0; i < 1000; i++ {
e.SetCompactionsEnabled(false)
e.SetCompactionsEnabled(true)
}
}()
done := make(chan struct{})
go func() {
wg.Wait()
close(done)
}()
// Wait for waitgroup or fail if it takes too long.
select {
case <-time.NewTimer(30 * time.Second).C:
t.Fatalf("timed out after 30 seconds waiting for waitgroup")
case <-done:
}
}
func BenchmarkEngine_WritePoints(b *testing.B) {
batchSizes := []int{10, 100, 1000, 5000, 10000}
for _, sz := range batchSizes {
e := MustOpenEngine()
pp := make([]models.Point, 0, sz)
for i := 0; i < sz; i++ {
p := MustParsePointString(fmt.Sprintf("cpu,host=%d value=1.2", i), "mm")
pp = append(pp, p)
}
b.Run(fmt.Sprintf("%d", sz), func(b *testing.B) {
b.ReportAllocs()
for i := 0; i < b.N; i++ {
err := e.WritePoints(pp)
if err != nil {
b.Fatal(err)
}
}
})
e.Close()
}
}
func BenchmarkEngine_WritePoints_Parallel(b *testing.B) {
batchSizes := []int{1000, 5000, 10000, 25000, 50000, 75000, 100000, 200000}
for _, sz := range batchSizes {
e := MustOpenEngine()
cpus := runtime.GOMAXPROCS(0)
pp := make([]models.Point, 0, sz*cpus)
for i := 0; i < sz*cpus; i++ {
p := MustParsePointString(fmt.Sprintf("cpu,host=%d value=1.2,other=%di", i, i), "mm")
pp = append(pp, p)
}
b.Run(fmt.Sprintf("%d", sz), func(b *testing.B) {
b.ReportAllocs()
for i := 0; i < b.N; i++ {
var wg sync.WaitGroup
errC := make(chan error)
for i := 0; i < cpus; i++ {
wg.Add(1)
go func(i int) {
defer wg.Done()
from, to := i*sz, (i+1)*sz
err := e.WritePoints(pp[from:to])
if err != nil {
errC <- err
return
}
}(i)
}
go func() {
wg.Wait()
close(errC)
}()
for err := range errC {
if err != nil {
b.Error(err)
}
}
}
})
e.Close()
}
}
func BenchmarkEngine_DeletePrefixRange_Cache(b *testing.B) {
config := tsm1.NewConfig()
config.Cache.SnapshotMemorySize = toml.Size(256 * 1024 * 1024)
e, err := NewEngine(config)
if err != nil {
b.Fatal(err)
}
if err := e.Open(context.Background()); err != nil {
b.Fatal(err)
}
pp := make([]models.Point, 0, 100000)
for i := 0; i < 100000; i++ {
p := MustParsePointString(fmt.Sprintf("cpu-%d,host=%d value=1.2", i%1000, i), fmt.Sprintf("000000001122111100000000112211%d", i%1000))
pp = append(pp, p)
}
b.Run("exists", func(b *testing.B) {
b.ReportAllocs()
for i := 0; i < b.N; i++ {
b.StopTimer()
if err = e.WritePoints(pp); err != nil {
b.Fatal(err)
}
b.StartTimer()
if err := e.DeletePrefixRange(context.Background(), []byte("0000000011221111000000001122112"), 0, math.MaxInt64, nil); err != nil {
b.Fatal(err)
}
}
})
b.Run("not_exists", func(b *testing.B) {
b.ReportAllocs()
for i := 0; i < b.N; i++ {
b.StopTimer()
if err = e.WritePoints(pp); err != nil {
b.Fatal(err)
}
b.StartTimer()
if err := e.DeletePrefixRange(context.Background(), []byte("fooasdasdasdasdasd"), 0, math.MaxInt64, nil); err != nil {
b.Fatal(err)
}
}
})
e.Close()
}
// Engine is a test wrapper for tsm1.Engine.
type Engine struct {
*tsm1.Engine
root string
indexPath string
index *tsi1.Index
sfile *tsdb.SeriesFile
}
// NewEngine returns a new instance of Engine at a temporary location.
func NewEngine(config tsm1.Config) (*Engine, error) {
root, err := ioutil.TempDir("", "tsm1-")
if err != nil {
panic(err)
}
// Setup series file.
sfile := tsdb.NewSeriesFile(filepath.Join(root, "_series"))
sfile.Logger = zap.NewNop()
if testing.Verbose() {
sfile.Logger = logger.New(os.Stdout)
}
if err = sfile.Open(context.Background()); err != nil {
return nil, err
}
idxPath := filepath.Join(root, "index")
idx := MustOpenIndex(idxPath, tsdb.NewSeriesIDSet(), sfile)
tsm1Engine := tsm1.NewEngine(filepath.Join(root, "data"), idx, config,
tsm1.WithCompactionPlanner(newMockPlanner()))
return &Engine{
Engine: tsm1Engine,
root: root,
indexPath: idxPath,
index: idx,
sfile: sfile,
}, nil
}
// MustOpenEngine returns a new, open instance of Engine.
func MustOpenEngine() *Engine {
e, err := NewEngine(tsm1.NewConfig())
if err != nil {
panic(err)
}
if err := e.Open(context.Background()); err != nil {
panic(err)
}
return e
}
// Close closes the engine and removes all underlying data.
func (e *Engine) Close() error {
return e.close(true)
}
func (e *Engine) close(cleanup bool) error {
err := e.Engine.Close()
if err != nil {
return err
}
if e.index != nil {
e.index.Close()
}
if e.sfile != nil {
e.sfile.Close()
}
if cleanup {
os.RemoveAll(e.root)
}
return nil
}
// Reopen closes and reopens the engine.
func (e *Engine) Reopen() error {
// Close engine without removing underlying engine data.
if err := e.close(false); err != nil {
return err
}
// Re-open series file. Must create a new series file using the same data.
e.sfile = tsdb.NewSeriesFile(e.sfile.Path())
if err := e.sfile.Open(context.Background()); err != nil {
return err
}
// Re-open index.
e.index = MustOpenIndex(e.indexPath, tsdb.NewSeriesIDSet(), e.sfile)
// Re-initialize engine.
config := tsm1.NewConfig()
e.Engine = tsm1.NewEngine(filepath.Join(e.root, "data"), e.index, config,
tsm1.WithCompactionPlanner(newMockPlanner()))
// Reopen engine
if err := e.Engine.Open(context.Background()); err != nil {
return err
}
// Reload series data into index (no-op on TSI).
return nil
}
// SeriesIDSet provides access to the underlying series id bitset in the engine's
// index. It will panic if the underlying index does not have a SeriesIDSet
// method.
func (e *Engine) SeriesIDSet() *tsdb.SeriesIDSet {
return e.index.SeriesIDSet()
}
// AddSeries adds the provided series data to the index and writes a point to
// the engine with default values for a field and a time of now.
func (e *Engine) AddSeries(name string, tags map[string]string) error {
point, err := models.NewPoint(name, models.NewTags(tags), models.Fields{"v": 1.0}, time.Now())
if err != nil {
return err
}
return e.writePoints(point)
}
// WritePointsString calls WritePointsString on the underlying engine, but also
// adds the associated series to the index.
func (e *Engine) WritePointsString(mm string, ptstr ...string) error {
points, err := models.ParsePointsString(strings.Join(ptstr, "\n"), mm)
if err != nil {
return err
}
return e.writePoints(points...)
}
// writePoints adds the series for the provided points to the index, and writes
// the point data to the engine.
func (e *Engine) writePoints(points ...models.Point) error {
// Write into the index.
collection := tsdb.NewSeriesCollection(points)
if err := e.index.CreateSeriesListIfNotExists(collection); err != nil {
return err
}
// Write the points into the cache/wal.
return e.WritePoints(points)
}
// MustAddSeries calls AddSeries, panicking if there is an error.
func (e *Engine) MustAddSeries(name string, tags map[string]string) {
if err := e.AddSeries(name, tags); err != nil {
panic(err)
}
}
// MustWriteSnapshot forces a snapshot of the engine. Panic on error.
func (e *Engine) MustWriteSnapshot() {
if err := e.WriteSnapshot(context.Background(), tsm1.CacheStatusColdNoWrites); err != nil {
panic(err)
}
}
// MustWritePointsString parses and writes the specified points to the
// provided org and bucket. Panic on error.
func (e *Engine) MustWritePointsString(org, bucket influxdb.ID, buf string) {
err := e.writePoints(MustParseExplodePoints(org, bucket, buf)...)
if err != nil {
panic(err)
}
}
// MustDeleteBucketRange calls DeletePrefixRange using the org and bucket for
// the prefix. Panic on error.
func (e *Engine) MustDeleteBucketRange(orgID, bucketID influxdb.ID, min, max int64) {
// TODO(edd): we need to clean up how we're encoding the prefix so that we
// don't have to remember to get it right everywhere we need to touch TSM data.
encoded := tsdb.EncodeName(orgID, bucketID)
name := models.EscapeMeasurement(encoded[:])
err := e.DeletePrefixRange(context.Background(), name, min, max, nil)
if err != nil {
panic(err)
}
}
func MustOpenIndex(path string, seriesIDSet *tsdb.SeriesIDSet, sfile *tsdb.SeriesFile) *tsi1.Index {
idx := tsi1.NewIndex(sfile, tsi1.NewConfig(), tsi1.WithPath(path))
if err := idx.Open(context.Background()); err != nil {
panic(err)
}
return idx
}
// SeriesFile is a test wrapper for tsdb.SeriesFile.
type SeriesFile struct {
*tsdb.SeriesFile
}
// NewSeriesFile returns a new instance of SeriesFile with a temporary file path.
func NewSeriesFile() *SeriesFile {
dir, err := ioutil.TempDir("", "tsdb-series-file-")
if err != nil {
panic(err)
}
return &SeriesFile{SeriesFile: tsdb.NewSeriesFile(dir)}
}
// MustOpenSeriesFile returns a new, open instance of SeriesFile. Panic on error.
func MustOpenSeriesFile() *SeriesFile {
f := NewSeriesFile()
if err := f.Open(context.Background()); err != nil {
panic(err)
}
return f
}
// Close closes the log file and removes it from disk.
func (f *SeriesFile) Close() {
defer os.RemoveAll(f.Path())
if err := f.SeriesFile.Close(); err != nil {
panic(err)
}
}
// MustParsePointsString parses points from a string. Panic on error.
func MustParsePointsString(buf, mm string) []models.Point {
a, err := models.ParsePointsString(buf, mm)
if err != nil {
panic(err)
}
return a
}
// MustParseExplodePoints parses points from a string and transforms using
// ExplodePoints using the provided org and bucket. Panic on error.
func MustParseExplodePoints(org, bucket influxdb.ID, buf string) []models.Point {
encoded := tsdb.EncodeName(org, bucket)
name := models.EscapeMeasurement(encoded[:])
return MustParsePointsString(buf, string(name))
}
// MustParsePointString parses the first point from a string. Panic on error.
func MustParsePointString(buf, mm string) models.Point { return MustParsePointsString(buf, mm)[0] }
type mockPlanner struct{}
func newMockPlanner() tsm1.CompactionPlanner {
return &mockPlanner{}
}
func (m *mockPlanner) Plan(lastWrite time.Time) []tsm1.CompactionGroup { return nil }
func (m *mockPlanner) PlanLevel(level int) []tsm1.CompactionGroup { return nil }
func (m *mockPlanner) PlanOptimize() []tsm1.CompactionGroup { return nil }
func (m *mockPlanner) Release(groups []tsm1.CompactionGroup) {}
func (m *mockPlanner) FullyCompacted() bool { return false }
func (m *mockPlanner) ForceFull() {}
func (m *mockPlanner) SetFileStore(fs *tsm1.FileStore) {}