influxdb/tsdb/engine.go

262 lines
7.1 KiB
Go
Raw Normal View History

2015-07-22 14:53:20 +00:00
package tsdb
import (
"bytes"
2015-07-22 14:53:20 +00:00
"errors"
"fmt"
"io"
"os"
"sort"
2015-07-22 14:53:20 +00:00
"time"
2015-11-04 21:06:06 +00:00
"github.com/influxdb/influxdb/influxql"
"github.com/influxdb/influxdb/models"
2015-07-22 14:53:20 +00:00
)
var (
// ErrFormatNotFound is returned when no format can be determined from a path.
ErrFormatNotFound = errors.New("format not found")
)
// Engine represents a swappable storage engine for the shard.
type Engine interface {
Open() error
Close() error
SetLogOutput(io.Writer)
2015-09-06 22:49:15 +00:00
LoadMetadataIndex(shard *Shard, index *DatabaseIndex, measurementFields map[string]*MeasurementFields) error
2015-07-22 14:53:20 +00:00
Begin(writable bool) (Tx, error)
WritePoints(points []models.Point, measurementFieldsToSave map[string]*MeasurementFields, seriesToCreate []*SeriesCreate) error
2015-07-22 14:53:20 +00:00
DeleteSeries(keys []string) error
DeleteMeasurement(name string, seriesKeys []string) error
SeriesCount() (n int, err error)
// PerformMaintenance will get called periodically by the store
PerformMaintenance()
// Format will return the format for the engine
Format() EngineFormat
io.WriterTo
Backup(w io.Writer, basePath string, since time.Time) error
2015-07-22 14:53:20 +00:00
}
type EngineFormat int
const (
2015-11-04 21:06:06 +00:00
TSM1Format EngineFormat = 2
)
2015-07-22 14:53:20 +00:00
// NewEngineFunc creates a new engine.
type NewEngineFunc func(path string, walPath string, options EngineOptions) Engine
2015-07-22 14:53:20 +00:00
// newEngineFuncs is a lookup of engine constructors by name.
var newEngineFuncs = make(map[string]NewEngineFunc)
// RegisterEngine registers a storage engine initializer by name.
func RegisterEngine(name string, fn NewEngineFunc) {
if _, ok := newEngineFuncs[name]; ok {
panic("engine already registered: " + name)
}
newEngineFuncs[name] = fn
}
// RegisteredEngines returns the slice of currently registered engines.
func RegisteredEngines() []string {
a := make([]string, 0, len(newEngineFuncs))
for k, _ := range newEngineFuncs {
a = append(a, k)
}
sort.Strings(a)
return a
}
2015-07-22 14:53:20 +00:00
// NewEngine returns an instance of an engine based on its format.
// If the path does not exist then the DefaultFormat is used.
func NewEngine(path string, walPath string, options EngineOptions) (Engine, error) {
2015-07-22 14:53:20 +00:00
// Create a new engine
if _, err := os.Stat(path); os.IsNotExist(err) {
return newEngineFuncs[options.EngineVersion](path, walPath, options), nil
2015-07-22 14:53:20 +00:00
}
2015-11-04 21:06:06 +00:00
// If it's a dir then it's a tsm1 engine
2015-07-22 14:53:20 +00:00
var format string
2015-11-04 21:06:06 +00:00
if fi, err := os.Stat(path); err != nil {
2015-07-22 14:53:20 +00:00
return nil, err
2015-11-04 21:06:06 +00:00
} else if !fi.Mode().IsDir() {
return nil, errors.New("unknown engine type")
} else {
format = "tsm1"
2015-07-22 14:53:20 +00:00
}
// Lookup engine by format.
fn := newEngineFuncs[format]
if fn == nil {
return nil, fmt.Errorf("invalid engine format: %q", format)
}
return fn(path, walPath, options), nil
2015-07-22 14:53:20 +00:00
}
// EngineOptions represents the options used to initialize the engine.
type EngineOptions struct {
EngineVersion string
2015-07-22 14:53:20 +00:00
MaxWALSize int
WALFlushInterval time.Duration
WALPartitionFlushDelay time.Duration
2015-08-18 20:59:54 +00:00
Config Config
2015-07-22 14:53:20 +00:00
}
// NewEngineOptions returns the default options.
func NewEngineOptions() EngineOptions {
return EngineOptions{
EngineVersion: DefaultEngine,
2015-07-22 14:53:20 +00:00
MaxWALSize: DefaultMaxWALSize,
WALFlushInterval: DefaultWALFlushInterval,
WALPartitionFlushDelay: DefaultWALPartitionFlushDelay,
2015-08-18 20:59:54 +00:00
Config: NewConfig(),
2015-07-22 14:53:20 +00:00
}
}
// Tx represents a transaction.
type Tx interface {
io.WriterTo
Size() int64
Commit() error
Rollback() error
2015-09-20 22:27:22 +00:00
Cursor(series string, fields []string, dec *FieldCodec, ascending bool) Cursor
2015-07-22 14:53:20 +00:00
}
2015-11-04 21:06:06 +00:00
func newTxIterator(tx Tx, sh *Shard, opt influxql.IteratorOptions, dimensions map[string]struct{}) (influxql.Iterator, error) {
// If there's no expression then it's just an auxilary field selection.
if opt.Expr == nil {
return newTxVarRefIterator(tx, sh, opt, dimensions)
}
// If raw data is being read then read it directly.
// Otherwise wrap it in a call iterator.
switch expr := opt.Expr.(type) {
case *influxql.VarRef:
return newTxVarRefIterator(tx, sh, opt, dimensions)
case *influxql.Call:
refOpt := opt
refOpt.Expr = expr.Args[0].(*influxql.VarRef)
input, err := newTxVarRefIterator(tx, sh, refOpt, dimensions)
if err != nil {
return nil, err
}
return influxql.NewCallIterator(input, opt), nil
default:
panic(fmt.Sprintf("unsupported tx iterator expr: %T", expr))
}
}
// newTxVarRefIterator creates an tx iterator for a variable reference.
func newTxVarRefIterator(tx Tx, sh *Shard, opt influxql.IteratorOptions, dimensions map[string]struct{}) (influxql.Iterator, error) {
ref, _ := opt.Expr.(*influxql.VarRef)
var itrs []influxql.Iterator
if err := func() error {
mms := Measurements(sh.index.MeasurementsByName(influxql.Sources(opt.Sources).Names()))
2015-12-23 18:05:05 +00:00
// Retrieve non-time field names from condition.
conditionFields := influxql.ExprNames(opt.Condition)
2015-11-04 21:06:06 +00:00
for _, mm := range mms {
// Determine tagsets for this measurement based on dimensions and filters.
tagSets, err := mm.TagSets(opt.Dimensions, opt.Condition)
if err != nil {
return err
}
2015-12-22 22:46:10 +00:00
// Calculate tag sets and apply SLIMIT/SOFFSET.
tagSets = influxql.LimitTagSets(tagSets, opt.SLimit, opt.SOffset)
2015-11-04 21:06:06 +00:00
for _, t := range tagSets {
for i, seriesKey := range t.SeriesKeys {
// Create field list for cursor.
fields := make([]string, 0, len(opt.Aux)+1)
if ref != nil {
fields = append(fields, ref.Val)
}
fields = append(fields, opt.Aux...)
2015-12-23 18:05:05 +00:00
fields = append(fields, conditionFields...)
2015-11-04 21:06:06 +00:00
// Create cursor.
cur := tx.Cursor(seriesKey, fields, sh.FieldCodec(mm.Name), opt.Ascending)
if cur == nil {
continue
}
// Create options specific for this series.
curOpt := opt
curOpt.Condition = t.Filters[i]
itr := NewFloatCursorIterator(mm.Name, sh.index.TagsForSeries(seriesKey), cur, curOpt)
itrs = append(itrs, itr)
}
}
}
return nil
}(); err != nil {
influxql.Iterators(itrs).Close()
return nil, err
}
// Merge iterators into one.
itr := influxql.NewMergeIterator(itrs, opt)
switch itr := itr.(type) {
case influxql.FloatIterator:
return &txFloatIterator{tx: tx, itr: itr}, nil
default:
panic(fmt.Sprintf("unsupported tx iterator input type: %T", itr))
}
}
// txFloatIterator represents an iterator with an attached transaction.
// It is used to track the Tx so it can be closed.
type txFloatIterator struct {
tx Tx
itr influxql.FloatIterator
}
// Close closes the underlying iterator and rolls back the transaction.
func (itr *txFloatIterator) Close() error {
defer itr.tx.Rollback()
return itr.itr.Close()
}
// Next returns the next point.
func (itr *txFloatIterator) Next() *influxql.FloatPoint { return itr.itr.Next() }
// DedupeEntries returns slices with unique keys (the first 8 bytes).
func DedupeEntries(a [][]byte) [][]byte {
// Convert to a map where the last slice is used.
m := make(map[string][]byte)
for _, b := range a {
m[string(b[0:8])] = b
}
// Convert map back to a slice of byte slices.
other := make([][]byte, 0, len(m))
for _, v := range m {
other = append(other, v)
}
// Sort entries.
sort.Sort(ByteSlices(other))
return other
}
type ByteSlices [][]byte
func (a ByteSlices) Len() int { return len(a) }
func (a ByteSlices) Swap(i, j int) { a[i], a[j] = a[j], a[i] }
func (a ByteSlices) Less(i, j int) bool { return bytes.Compare(a[i], a[j]) == -1 }