influxdb/tsdb/tsi1/index_file_test.go

272 lines
7.9 KiB
Go

package tsi1_test
import (
"bytes"
"context"
"fmt"
"reflect"
"testing"
"time"
"github.com/influxdata/influxdb/models"
"github.com/influxdata/influxdb/tsdb"
"github.com/influxdata/influxdb/tsdb/seriesfile"
"github.com/influxdata/influxdb/tsdb/tsi1"
)
// Ensure a simple index file can be built and opened.
func TestCreateIndexFile(t *testing.T) {
sfile := MustOpenSeriesFile()
defer sfile.Close()
f, err := CreateIndexFile(sfile.SeriesFile, []Series{
{Name: []byte("cpu"), Tags: models.NewTags(map[string]string{"region": "east"}), Type: models.Integer},
{Name: []byte("cpu"), Tags: models.NewTags(map[string]string{"region": "west"}), Type: models.Integer},
{Name: []byte("mem"), Tags: models.NewTags(map[string]string{"region": "east"}), Type: models.Integer},
})
if err != nil {
t.Fatal(err)
}
defer f.Close()
if e := f.TagValueElem([]byte("cpu"), []byte("region"), []byte("west")); e == nil {
t.Fatal("expected element")
} else if n := e.(*tsi1.TagBlockValueElem).SeriesN(); n != 1 {
t.Fatalf("unexpected series count: %d", n)
}
}
func TestIndexFile_TagKeySeriesIDIterator(t *testing.T) {
sfile := MustOpenSeriesFile()
defer sfile.Close()
f, err := CreateIndexFile(sfile.SeriesFile, []Series{
{Name: []byte("mem"), Tags: models.NewTags(map[string]string{"region": "east"}), Type: models.Integer},
{Name: []byte("cpu"), Tags: models.NewTags(map[string]string{"region": "east"}), Type: models.Integer},
{Name: []byte("cpu"), Tags: models.NewTags(map[string]string{"region": "west"}), Type: models.Integer},
})
if err != nil {
t.Fatal(err)
}
defer f.Close()
itr, err := f.TagKeySeriesIDIterator([]byte("cpu"), []byte("region"))
if err != nil {
t.Fatal(err)
}
defer itr.Close()
// NOTE(edd): the series keys end up being emitted in this order because the
// series were written to different partitons in the _series file_. As such,
// the key with region=west ends up with a lower series ID than the region=east
// series, even though it was written later. When the series id sets for each
// tag block in the index file are merged together and iterated, the roaring
// bitmap library sorts the series ids, resulting the the series keys being
// emitted in a different order to that which they were written.
exp := []string{"cpu,region=west", "cpu,region=east"}
var got []string
for {
e, err := itr.Next()
if err != nil {
t.Fatal(err)
}
if e.SeriesID.ID == 0 {
break
}
fmt.Println(e.SeriesID.ID)
name, tags := seriesfile.ParseSeriesKey(sfile.SeriesKey(e.SeriesID))
got = append(got, string(models.MustNewPoint(string(name), tags, models.Fields{"a": "a"}, time.Time{}).Key()))
}
if !reflect.DeepEqual(got, exp) {
t.Fatalf("got keys %v, expected %v", got, exp)
}
}
// Ensure index file generation can be successfully built.
func TestGenerateIndexFile(t *testing.T) {
sfile := MustOpenSeriesFile()
defer sfile.Close()
// Build generated index file.
f, err := GenerateIndexFile(sfile.SeriesFile, 10, 3, 4)
if err != nil {
t.Fatal(err)
}
defer f.Close()
// Verify that tag/value series can be fetched.
if e := f.TagValueElem([]byte("measurement0"), []byte("key0"), []byte("value0")); e == nil {
t.Fatal("expected element")
} else if n := e.(*tsi1.TagBlockValueElem).SeriesN(); n == 0 {
t.Fatal("expected series")
}
}
// Ensure index file generated with uvarint encoding can be loaded.
func TestGenerateIndexFile_Uvarint(t *testing.T) {
// Load previously generated series file.
sfile := seriesfile.NewSeriesFile("testdata/uvarint/_series")
if err := sfile.Open(context.Background()); err != nil {
t.Fatal(err)
}
defer sfile.Close()
// Load legacy index file from buffer.
f := tsi1.NewIndexFile(sfile)
f.SetPath("testdata/uvarint/index")
if err := f.Open(); err != nil {
t.Fatal(err)
}
defer f.Close()
// Verify that tag/value series can be fetched.
if e := f.TagValueElem([]byte("measurement0"), []byte("key0"), []byte("value0")); e == nil {
t.Fatal("expected element")
} else if n := e.(*tsi1.TagBlockValueElem).SeriesN(); n == 0 {
t.Fatal("expected series")
}
}
// Ensure a MeasurementHashSeries returns false when all series are tombstoned.
func TestIndexFile_MeasurementHasSeries_Tombstoned(t *testing.T) {
sfile := MustOpenSeriesFile()
defer sfile.Close()
f, err := CreateIndexFile(sfile.SeriesFile, []Series{
{Name: []byte("cpu"), Tags: models.NewTags(map[string]string{"region": "east"}), Type: models.Integer},
})
if err != nil {
t.Fatal(err)
}
defer f.Close()
// Simulate all series are tombstoned
ss := tsdb.NewSeriesIDSet()
if f.MeasurementHasSeries(ss, []byte("cpu")) {
t.Fatalf("MeasurementHasSeries got true, exp false")
}
}
func BenchmarkIndexFile_TagValueSeries(b *testing.B) {
b.Run("M=1,K=2,V=3", func(b *testing.B) {
sfile := MustOpenSeriesFile()
defer sfile.Close()
benchmarkIndexFile_TagValueSeries(b, MustFindOrGenerateIndexFile(sfile.SeriesFile, 1, 2, 3))
})
b.Run("M=10,K=5,V=5", func(b *testing.B) {
sfile := MustOpenSeriesFile()
defer sfile.Close()
benchmarkIndexFile_TagValueSeries(b, MustFindOrGenerateIndexFile(sfile.SeriesFile, 10, 5, 5))
})
b.Run("M=10,K=7,V=5", func(b *testing.B) {
sfile := MustOpenSeriesFile()
defer sfile.Close()
benchmarkIndexFile_TagValueSeries(b, MustFindOrGenerateIndexFile(sfile.SeriesFile, 10, 7, 7))
})
}
func benchmarkIndexFile_TagValueSeries(b *testing.B, idx *tsi1.IndexFile) {
b.ResetTimer()
b.ReportAllocs()
for i := 0; i < b.N; i++ {
if e := idx.TagValueElem([]byte("measurement0"), []byte("key0"), []byte("value0")); e == nil {
b.Fatal("expected element")
} else if e.(*tsi1.TagBlockValueElem).SeriesN() == 0 {
b.Fatal("expected series")
}
}
}
// CreateIndexFile creates an index file with a given set of series.
func CreateIndexFile(sfile *seriesfile.SeriesFile, series []Series) (*tsi1.IndexFile, error) {
lf, err := CreateLogFile(sfile, series)
if err != nil {
return nil, err
}
defer lf.Close()
// Write index file to buffer.
var buf bytes.Buffer
if _, err := lf.CompactTo(&buf, M, K, nil); err != nil {
return nil, err
}
// Load index file from buffer.
f := tsi1.NewIndexFile(sfile)
if err := f.UnmarshalBinary(buf.Bytes()); err != nil {
return nil, err
}
return f, nil
}
// GenerateIndexFile generates an index file from a set of series based on the count arguments.
// Total series returned will equal measurementN * tagN * valueN.
func GenerateIndexFile(sfile *seriesfile.SeriesFile, measurementN, tagN, valueN int) (*tsi1.IndexFile, error) {
// Generate a new log file first.
lf, err := GenerateLogFile(sfile, measurementN, tagN, valueN)
if err != nil {
return nil, err
}
defer lf.Close()
// Compact log file to buffer.
var buf bytes.Buffer
if _, err := lf.CompactTo(&buf, M, K, nil); err != nil {
return nil, err
}
// Load index file from buffer.
f := tsi1.NewIndexFile(sfile)
if err := f.UnmarshalBinary(buf.Bytes()); err != nil {
return nil, err
}
return f, nil
}
func MustGenerateIndexFile(sfile *seriesfile.SeriesFile, measurementN, tagN, valueN int) *tsi1.IndexFile {
f, err := GenerateIndexFile(sfile, measurementN, tagN, valueN)
if err != nil {
panic(err)
}
return f
}
var indexFileCache struct {
MeasurementN int
TagN int
ValueN int
IndexFile *tsi1.IndexFile
}
// MustFindOrGenerateIndexFile returns a cached index file or generates one if it doesn't exist.
func MustFindOrGenerateIndexFile(sfile *seriesfile.SeriesFile, measurementN, tagN, valueN int) *tsi1.IndexFile {
// Use cache if fields match and the index file has been generated.
if indexFileCache.MeasurementN == measurementN &&
indexFileCache.TagN == tagN &&
indexFileCache.ValueN == valueN &&
indexFileCache.IndexFile != nil {
return indexFileCache.IndexFile
}
// Generate and cache.
indexFileCache.MeasurementN = measurementN
indexFileCache.TagN = tagN
indexFileCache.ValueN = valueN
indexFileCache.IndexFile = MustGenerateIndexFile(sfile, measurementN, tagN, valueN)
return indexFileCache.IndexFile
}
func pow(x, y int) int {
r := 1
for i := 0; i < y; i++ {
r *= x
}
return r
}