From 0883182798c8155b066fdc7754f70e759c5b258e Mon Sep 17 00:00:00 2001 From: Ben Johnson Date: Fri, 11 Sep 2015 11:57:33 -0600 Subject: [PATCH 1/8] simplify select mapper stmt --- tsdb/executor.go | 2 +- tsdb/mapper.go | 80 ++++++++++++++++----------------------- tsdb/show_measurements.go | 5 +-- 3 files changed, 34 insertions(+), 53 deletions(-) diff --git a/tsdb/executor.go b/tsdb/executor.go index 3d777751f0..78d65c9488 100644 --- a/tsdb/executor.go +++ b/tsdb/executor.go @@ -30,7 +30,7 @@ type Executor interface { // Mapper is the interface all Mapper types must implement. type Mapper interface { Open() error - SetRemote(m Mapper) error + SetRemote(m Mapper) TagSets() []string Fields() []string NextChunk() (interface{}, error) diff --git a/tsdb/mapper.go b/tsdb/mapper.go index 11e6f52bc3..6baea3b084 100644 --- a/tsdb/mapper.go +++ b/tsdb/mapper.go @@ -110,8 +110,7 @@ func (mo *MapperOutput) key() string { type SelectMapper struct { shard *Shard remote Mapper - stmt influxql.Statement - selectStmt *influxql.SelectStatement + stmt *influxql.SelectStatement rawMode bool chunkSize int tx Tx // Read transaction for this shard. @@ -135,7 +134,7 @@ type SelectMapper struct { } // NewSelectMapper returns a mapper for the given shard, which will return data for the SELECT statement. -func NewSelectMapper(shard *Shard, stmt influxql.Statement, chunkSize int) *SelectMapper { +func NewSelectMapper(shard *Shard, stmt *influxql.SelectStatement, chunkSize int) *SelectMapper { return &SelectMapper{ shard: shard, stmt: stmt, @@ -144,14 +143,9 @@ func NewSelectMapper(shard *Shard, stmt influxql.Statement, chunkSize int) *Sele } } -// openMeta opens the mapper for a meta query. -func (lm *SelectMapper) openMeta() error { - return errors.New("not implemented") -} - func (lm *SelectMapper) timeDirection() Direction { - if len(lm.selectStmt.SortFields) > 0 { - if lm.selectStmt.SortFields[0].Ascending { + if len(lm.stmt.SortFields) > 0 { + if lm.stmt.SortFields[0].Ascending { return Forward } else { return Reverse @@ -190,23 +184,19 @@ func (lm *SelectMapper) Open() error { lm.tx = tx if err := func() error { - if s, ok := lm.stmt.(*influxql.SelectStatement); ok { - stmt, err := lm.rewriteSelectStatement(s) - if err != nil { - return err - } - lm.selectStmt = stmt - lm.rawMode = (s.IsRawQuery && !s.HasDistinct()) || s.IsSimpleDerivative() - } else { - return lm.openMeta() + stmt, err := lm.rewriteSelectStatement(lm.stmt) + if err != nil { + return err } + lm.stmt = stmt + lm.rawMode = (stmt.IsRawQuery && !stmt.HasDistinct()) || stmt.IsSimpleDerivative() // Set all time-related parameters on the mapper. - lm.queryTMin, lm.queryTMax = influxql.TimeRangeAsEpochNano(lm.selectStmt.Condition) + lm.queryTMin, lm.queryTMax = influxql.TimeRangeAsEpochNano(lm.stmt.Condition) if !lm.rawMode { // For GROUP BY time queries, limit the number of data points returned by the limit and offset - d, err := lm.selectStmt.GroupByInterval() + d, err := lm.stmt.GroupByInterval() if err != nil { return err } @@ -220,16 +210,16 @@ func (lm *SelectMapper) Open() error { lm.numIntervals = int((intervalTop - intervalBottom) / lm.intervalSize) } - if lm.selectStmt.Limit > 0 || lm.selectStmt.Offset > 0 { + if lm.stmt.Limit > 0 || lm.stmt.Offset > 0 { // ensure that the offset isn't higher than the number of points we'd get - if lm.selectStmt.Offset > lm.numIntervals { + if lm.stmt.Offset > lm.numIntervals { return nil } // Take the lesser of either the pre computed number of GROUP BY buckets that // will be in the result or the limit passed in by the user - if lm.selectStmt.Limit < lm.numIntervals { - lm.numIntervals = lm.selectStmt.Limit + if lm.stmt.Limit < lm.numIntervals { + lm.numIntervals = lm.stmt.Limit } } @@ -250,7 +240,7 @@ func (lm *SelectMapper) Open() error { whereFields := newStringSet() // Create the TagSet cursors for the Mapper. - for _, src := range lm.selectStmt.Sources { + for _, src := range lm.stmt.Sources { mm, ok := src.(*influxql.Measurement) if !ok { return fmt.Errorf("invalid source type: %#v", src) @@ -264,12 +254,12 @@ func (lm *SelectMapper) Open() error { } // Validate that ANY GROUP BY is not a field for the measurement. - if err := m.ValidateGroupBy(lm.selectStmt); err != nil { + if err := m.ValidateGroupBy(lm.stmt); err != nil { return err } // Create tagset cursors and determine various field types within SELECT statement. - tsf, err := createTagSetsAndFields(m, lm.selectStmt) + tsf, err := createTagSetsAndFields(m, lm.stmt) if err != nil { return err } @@ -284,20 +274,20 @@ func (lm *SelectMapper) Open() error { } // Validate that any GROUP BY is not on a field - if err := m.ValidateGroupBy(lm.selectStmt); err != nil { + if err := m.ValidateGroupBy(lm.stmt); err != nil { return err } // SLIMIT and SOFFSET the unique series - if lm.selectStmt.SLimit > 0 || lm.selectStmt.SOffset > 0 { - if lm.selectStmt.SOffset > len(tagSets) { + if lm.stmt.SLimit > 0 || lm.stmt.SOffset > 0 { + if lm.stmt.SOffset > len(tagSets) { tagSets = nil } else { - if lm.selectStmt.SOffset+lm.selectStmt.SLimit > len(tagSets) { - lm.selectStmt.SLimit = len(tagSets) - lm.selectStmt.SOffset + if lm.stmt.SOffset+lm.stmt.SLimit > len(tagSets) { + lm.stmt.SLimit = len(tagSets) - lm.stmt.SOffset } - tagSets = tagSets[lm.selectStmt.SOffset : lm.selectStmt.SOffset+lm.selectStmt.SLimit] + tagSets = tagSets[lm.stmt.SOffset : lm.stmt.SOffset+lm.stmt.SLimit] } } @@ -376,10 +366,7 @@ func (lm *SelectMapper) Open() error { return nil } -func (lm *SelectMapper) SetRemote(m Mapper) error { - lm.remote = m - return nil -} +func (lm *SelectMapper) SetRemote(m Mapper) { lm.remote = m } func (lm *SelectMapper) NextChunk() (interface{}, error) { // If set, use remote mapper. @@ -575,10 +562,10 @@ func (lm *SelectMapper) nextChunkAgg() (interface{}, error) { } tminf := func() int64 { - if len(lm.selectStmt.Dimensions) == 0 { + if len(lm.stmt.Dimensions) == 0 { return -1 } - if !lm.selectStmt.HasTimeFieldSpecified() { + if !lm.stmt.HasTimeFieldSpecified() { return tmin } return -1 @@ -602,7 +589,7 @@ func (lm *SelectMapper) nextChunkAgg() (interface{}, error) { // nextInterval returns the next interval for which to return data. If start is less than 0 // there are no more intervals. func (lm *SelectMapper) nextInterval() (start, end int64) { - t := lm.queryTMinWindow + int64(lm.currInterval+lm.selectStmt.Offset)*lm.intervalSize + t := lm.queryTMinWindow + int64(lm.currInterval+lm.stmt.Offset)*lm.intervalSize // Onto next interval. lm.currInterval++ @@ -619,12 +606,7 @@ func (lm *SelectMapper) nextInterval() (start, end int64) { func (lm *SelectMapper) initializeMapFunctions() error { var err error // Set up each mapping function for this statement. - selectStmt, ok := lm.stmt.(*influxql.SelectStatement) - if !ok { - return fmt.Errorf("No map functions for non-SELECT statement: %s", lm.stmt.String()) - } - - aggregates := selectStmt.FunctionCalls() + aggregates := lm.stmt.FunctionCalls() lm.mapFuncs = make([]mapFunc, len(aggregates)) lm.mapUnmarshallers = make([]unmarshalFunc, len(aggregates)) lm.fieldNames = make([]string, len(lm.mapFuncs)) @@ -661,19 +643,21 @@ func (lm *SelectMapper) initializeMapFunctions() error { // rewriteSelectStatement performs any necessary query re-writing. func (lm *SelectMapper) rewriteSelectStatement(stmt *influxql.SelectStatement) (*influxql.SelectStatement, error) { - var err error // Expand regex expressions in the FROM clause. sources, err := expandSources(stmt.Sources, lm.shard.index) if err != nil { return nil, err } stmt.Sources = sources + // Expand wildcards in the fields or GROUP BY. stmt, err = lm.expandWildcards(stmt) if err != nil { return nil, err } + stmt.RewriteDistinct() + return stmt, nil } diff --git a/tsdb/show_measurements.go b/tsdb/show_measurements.go index 90c035dacf..4aa5e8f002 100644 --- a/tsdb/show_measurements.go +++ b/tsdb/show_measurements.go @@ -176,10 +176,7 @@ func (m *ShowMeasurementsMapper) Open() error { } // SetRemote sets the remote mapper to use. -func (m *ShowMeasurementsMapper) SetRemote(remote Mapper) error { - m.remote = remote - return nil -} +func (m *ShowMeasurementsMapper) SetRemote(remote Mapper) { m.remote = remote } // TagSets is only implemented on this mapper to satisfy the Mapper interface. func (m *ShowMeasurementsMapper) TagSets() []string { return nil } From 1b8b6257871dc3dd3b4613e28b53008d72c67d3a Mon Sep 17 00:00:00 2001 From: Ben Johnson Date: Wed, 16 Sep 2015 14:17:58 -0600 Subject: [PATCH 2/8] refactor SelectMapper --- cluster/shard_mapper.go | 83 ++- cluster/shard_mapper_test.go | 6 +- influxql/ast.go | 12 + tsdb/cursor.go | 276 +++++++ tsdb/executor.go | 33 - tsdb/functions.go | 4 +- tsdb/mapper.go | 1333 +++++++++++----------------------- tsdb/mapper_test.go | 23 +- tsdb/meta.go | 247 +++++++ tsdb/show_measurements.go | 24 +- tsdb/store.go | 17 +- 11 files changed, 1073 insertions(+), 985 deletions(-) diff --git a/cluster/shard_mapper.go b/cluster/shard_mapper.go index 88000bde71..0b2fc7a072 100644 --- a/cluster/shard_mapper.go +++ b/cluster/shard_mapper.go @@ -1,6 +1,7 @@ package cluster import ( + "encoding/json" "fmt" "math/rand" "net" @@ -40,11 +41,7 @@ func NewShardMapper(timeout time.Duration) *ShardMapper { // CreateMapper returns a Mapper for the given shard ID. func (s *ShardMapper) CreateMapper(sh meta.ShardInfo, stmt influxql.Statement, chunkSize int) (tsdb.Mapper, error) { - m, err := s.TSDBStore.CreateMapper(sh.ID, stmt, chunkSize) - if err != nil { - return nil, err - } - + // Create a remote mapper if the local node doesn't own the shard. if !sh.OwnedBy(s.MetaStore.NodeID()) || s.ForceRemoteMapping { // Pick a node in a pseudo-random manner. conn, err := s.dial(sh.Owners[rand.Intn(len(sh.Owners))].NodeID) @@ -53,7 +50,13 @@ func (s *ShardMapper) CreateMapper(sh meta.ShardInfo, stmt influxql.Statement, c } conn.SetDeadline(time.Now().Add(s.timeout)) - m.SetRemote(NewRemoteMapper(conn, sh.ID, stmt, chunkSize)) + return NewRemoteMapper(conn, sh.ID, stmt, chunkSize), nil + } + + // If it is local then return the mapper from the store. + m, err := s.TSDBStore.CreateMapper(sh.ID, stmt, chunkSize) + if err != nil { + return nil, err } return m, nil @@ -87,6 +90,8 @@ type RemoteMapper struct { conn net.Conn bufferedResponse *MapShardResponse + + unmarshallers []tsdb.UnmarshalFunc // Mapping-specific unmarshal functions. } // NewRemoteMapper returns a new remote mapper using the given connection. @@ -106,6 +111,7 @@ func (r *RemoteMapper) Open() (err error) { r.conn.Close() } }() + // Build Map request. var request MapShardRequest request.SetShardID(r.shardID) @@ -143,11 +149,18 @@ func (r *RemoteMapper) Open() (err error) { r.tagsets = r.bufferedResponse.TagSets() r.fields = r.bufferedResponse.Fields() - return nil -} + // Set up each mapping function for this statement. + if stmt, ok := r.stmt.(*influxql.SelectStatement); ok { + for _, c := range stmt.FunctionCalls() { + fn, err := tsdb.InitializeUnmarshaller(c) + if err != nil { + return err + } + r.unmarshallers = append(r.unmarshallers, fn) + } + } -func (r *RemoteMapper) SetRemote(m tsdb.Mapper) error { - return fmt.Errorf("cannot set remote mapper on a remote mapper") + return nil } func (r *RemoteMapper) TagSets() []string { @@ -187,7 +200,55 @@ func (r *RemoteMapper) NextChunk() (chunk interface{}, err error) { return nil, nil } - return response.Data(), err + moj := &tsdb.MapperOutputJSON{} + if err := json.Unmarshal(response.Data(), moj); err != nil { + return nil, err + } + mvj := []*tsdb.MapperValueJSON{} + if err := json.Unmarshal(moj.Values, &mvj); err != nil { + return nil, err + } + + // Prep the non-JSON version of Mapper output. + mo := &tsdb.MapperOutput{ + Name: moj.Name, + Tags: moj.Tags, + Fields: moj.Fields, + } + + if len(mvj) == 1 && len(mvj[0].AggData) > 0 { + // The MapperValue is carrying aggregate data, so run it through the + // custom unmarshallers for the map functions through which the data + // was mapped. + aggValues := []interface{}{} + for i, b := range mvj[0].AggData { + v, err := r.unmarshallers[i](b) + if err != nil { + return nil, err + } + aggValues = append(aggValues, v) + } + mo.Values = []*tsdb.MapperValue{&tsdb.MapperValue{ + Value: aggValues, + Tags: mvj[0].Tags, + }} + } else { + // Must be raw data instead. + for _, v := range mvj { + var rawValue interface{} + if err := json.Unmarshal(v.RawData, &rawValue); err != nil { + return nil, err + } + + mo.Values = append(mo.Values, &tsdb.MapperValue{ + Time: v.Time, + Value: rawValue, + Tags: v.Tags, + }) + } + } + + return mo, nil } // Close the Mapper diff --git a/cluster/shard_mapper_test.go b/cluster/shard_mapper_test.go index 9557352994..3a80f596e5 100644 --- a/cluster/shard_mapper_test.go +++ b/cluster/shard_mapper_test.go @@ -80,14 +80,10 @@ func TestShardWriter_RemoteMapper_Success(t *testing.T) { if err != nil { t.Fatalf("failed to get next chunk from mapper: %s", err.Error()) } - b, ok := chunk.([]byte) + output, ok := chunk.(*tsdb.MapperOutput) if !ok { t.Fatal("chunk is not of expected type") } - output := &tsdb.MapperOutput{} - if err := json.Unmarshal(b, output); err != nil { - t.Fatal(err) - } if output.Name != "cpu" { t.Fatalf("received output incorrect, exp: %v, got %v", expOutput, output) } diff --git a/influxql/ast.go b/influxql/ast.go index 56eb8683e3..3a343d6a5c 100644 --- a/influxql/ast.go +++ b/influxql/ast.go @@ -743,6 +743,11 @@ func (s *SelectStatement) IsSimpleDerivative() bool { return false } +// TimeAscending returns true if the time field is sorted in chronological order. +func (s *SelectStatement) TimeAscending() bool { + return len(s.SortFields) == 0 || s.SortFields[0].Ascending +} + // Clone returns a deep copy of the statement. func (s *SelectStatement) Clone() *SelectStatement { clone := &SelectStatement{ @@ -2937,6 +2942,13 @@ func evalBinaryExpr(expr *BinaryExpr, m map[string]interface{}) interface{} { return nil } +// EvalBool evaluates expr and returns true if result is a boolean true. +// Otherwise returns false. +func EvalBool(expr Expr, m map[string]interface{}) bool { + v, _ := Eval(expr, m).(bool) + return v +} + // Reduce evaluates expr using the available values in valuer. // References that don't exist in valuer are ignored. func Reduce(expr Expr, valuer Valuer) Expr { diff --git a/tsdb/cursor.go b/tsdb/cursor.go index b1f0e771fa..7fb2377084 100644 --- a/tsdb/cursor.go +++ b/tsdb/cursor.go @@ -3,6 +3,11 @@ package tsdb import ( "bytes" "container/heap" + "encoding/binary" + "sort" + "strings" + + "github.com/influxdb/influxdb/influxql" ) // Direction represents a cursor navigation direction. @@ -152,3 +157,274 @@ type cursorHeapItem struct { cursor Cursor priority int } + +// TagSetCursor is virtual cursor that iterates over mutiple series cursors, as though it were +// a single series. +type TagSetCursor struct { + measurement string // Measurement name + tags map[string]string // Tag key-value pairs + cursors []*seriesCursor // Underlying series cursors. + decoder *FieldCodec // decoder for the raw data bytes + currentTags map[string]string // the current tags for the underlying series cursor in play + + // pointHeap is a min-heap, ordered by timestamp, that contains the next + // point from each seriesCursor. Queries sometimes pull points from + // thousands of series. This makes it reasonably efficient to find the + // point with the next lowest timestamp among the thousands of series that + // the query is pulling points from. + // Performance profiling shows that this lookahead needs to be part + // of the TagSetCursor type and not part of the the cursors type. + pointHeap *pointHeap + + // Memomize the cursor's tagset-based key. Profiling shows that calculating this + // is significant CPU cost, and it only needs to be done once. + memokey string +} + +// TagSetCursors represents a sortable slice of TagSetCursors. +type TagSetCursors []*TagSetCursor + +func (a TagSetCursors) Len() int { return len(a) } +func (a TagSetCursors) Less(i, j int) bool { return a[i].key() < a[j].key() } +func (a TagSetCursors) Swap(i, j int) { a[i], a[j] = a[j], a[i] } + +func (a TagSetCursors) Keys() []string { + keys := []string{} + for i := range a { + keys = append(keys, a[i].key()) + } + sort.Strings(keys) + return keys +} + +// NewTagSetCursor returns a instance of TagSetCursor. +func NewTagSetCursor(m string, t map[string]string, c []*seriesCursor, d *FieldCodec) *TagSetCursor { + tsc := &TagSetCursor{ + measurement: m, + tags: t, + cursors: c, + decoder: d, + pointHeap: newPointHeap(), + } + + return tsc +} + +func (tsc *TagSetCursor) key() string { + if tsc.memokey == "" { + if len(tsc.tags) == 0 { + tsc.memokey = tsc.measurement + } else { + tsc.memokey = strings.Join([]string{tsc.measurement, string(MarshalTags(tsc.tags))}, "|") + } + } + return tsc.memokey +} + +func (tsc *TagSetCursor) SeekTo(seek int64) { + tsc.pointHeap = newPointHeap() + + // Prime the buffers. + for i := 0; i < len(tsc.cursors); i++ { + k, v := tsc.cursors[i].SeekTo(seek) + if k == -1 { + k, v = tsc.cursors[i].Next() + } + if k == -1 { + continue + } + + heap.Push(tsc.pointHeap, &pointHeapItem{ + timestamp: k, + value: v, + cursor: tsc.cursors[i], + }) + } +} + +// Next returns the next matching series-key, timestamp byte slice and meta tags for the tagset. Filtering +// is enforced on the values. If there is no matching value, then a nil result is returned. +func (tsc *TagSetCursor) Next(tmin, tmax int64, selectFields, whereFields []string) (int64, interface{}) { + for { + // If we're out of points, we're done. + if tsc.pointHeap.Len() == 0 { + return -1, nil + } + + // Grab the next point with the lowest timestamp. + p := heap.Pop(tsc.pointHeap).(*pointHeapItem) + + // We're done if the point is outside the query's time range [tmin:tmax). + if p.timestamp != tmin && (p.timestamp < tmin || p.timestamp >= tmax) { + return -1, nil + } + + // Decode the raw point. + value := tsc.decodeRawPoint(p, selectFields, whereFields) + timestamp := p.timestamp + + // Keep track of the current tags for the series cursor so we can + // respond with them if asked + tsc.currentTags = p.cursor.tags + + // Advance the cursor + nextKey, nextVal := p.cursor.Next() + if nextKey != -1 { + *p = pointHeapItem{ + timestamp: nextKey, + value: nextVal, + cursor: p.cursor, + } + heap.Push(tsc.pointHeap, p) + } + + // Value didn't match, look for the next one. + if value == nil { + continue + } + + return timestamp, value + } +} + +// Tags returns the current tags of the current cursor +// if there is no current currsor, it returns nil +func (tsc *TagSetCursor) Tags() map[string]string { + return tsc.currentTags +} + +// decodeRawPoint decodes raw point data into field names & values and does WHERE filtering. +func (tsc *TagSetCursor) decodeRawPoint(p *pointHeapItem, selectFields, whereFields []string) interface{} { + if len(selectFields) > 1 { + if fieldsWithNames, err := tsc.decoder.DecodeFieldsWithNames(p.value); err == nil { + // if there's a where clause, make sure we don't need to filter this value + if p.cursor.filter != nil && !influxql.EvalBool(p.cursor.filter, fieldsWithNames) { + return nil + } + + return fieldsWithNames + } + } + + // With only 1 field SELECTed, decoding all fields may be avoidable, which is faster. + value, err := tsc.decoder.DecodeByName(selectFields[0], p.value) + if err != nil { + return nil + } + + // If there's a WHERE clase, see if we need to filter + if p.cursor.filter != nil { + // See if the WHERE is only on this field or on one or more other fields. + // If the latter, we'll have to decode everything + if len(whereFields) == 1 && whereFields[0] == selectFields[0] { + if !influxql.EvalBool(p.cursor.filter, map[string]interface{}{selectFields[0]: value}) { + value = nil + } + } else { // Decode everything + fieldsWithNames, err := tsc.decoder.DecodeFieldsWithNames(p.value) + if err != nil || !influxql.EvalBool(p.cursor.filter, fieldsWithNames) { + value = nil + } + } + } + + return value +} + +type pointHeapItem struct { + timestamp int64 + value []byte + cursor *seriesCursor // cursor whence pointHeapItem came +} + +type pointHeap []*pointHeapItem + +func newPointHeap() *pointHeap { + q := make(pointHeap, 0) + heap.Init(&q) + return &q +} + +func (pq pointHeap) Len() int { return len(pq) } + +func (pq pointHeap) Less(i, j int) bool { + // We want a min-heap (points in chronological order), so use less than. + return pq[i].timestamp < pq[j].timestamp +} + +func (pq pointHeap) Swap(i, j int) { pq[i], pq[j] = pq[j], pq[i] } + +func (pq *pointHeap) Push(x interface{}) { + item := x.(*pointHeapItem) + *pq = append(*pq, item) +} + +func (pq *pointHeap) Pop() interface{} { + old := *pq + n := len(old) + item := old[n-1] + *pq = old[0 : n-1] + return item +} + +// seriesCursor is a cursor that walks a single series. It provides lookahead functionality. +type seriesCursor struct { + cursor Cursor // BoltDB cursor for a series + filter influxql.Expr + tags map[string]string + seekto int64 + seekResult struct { + k int64 + v []byte + } +} + +// newSeriesCursor returns a new instance of a series cursor. +func newSeriesCursor(cur Cursor, filter influxql.Expr, tags map[string]string) *seriesCursor { + return &seriesCursor{ + cursor: cur, + filter: filter, + tags: tags, + seekto: -1, + } +} + +// Seek positions returning the timestamp and value at that key. +func (sc *seriesCursor) SeekTo(key int64) (timestamp int64, value []byte) { + if sc.seekto != -1 && sc.seekto < key && (sc.seekResult.k == -1 || sc.seekResult.k >= key) { + // we've seeked on this cursor. This seek is after that previous cached seek + // and the result it gave was after the key for this seek. + // + // In this case, any seek would just return what we got before, so there's + // no point in reseeking. + return sc.seekResult.k, sc.seekResult.v + } + k, v := sc.cursor.Seek(u64tob(uint64(key))) + if k == nil { + timestamp = -1 + } else { + timestamp, value = int64(btou64(k)), v + } + sc.seekto = key + sc.seekResult.k = timestamp + sc.seekResult.v = v + return +} + +// Next returns the next timestamp and value from the cursor. +func (sc *seriesCursor) Next() (key int64, value []byte) { + // calling next on this cursor means that we need to invalidate the seek + sc.seekto = -1 + sc.seekResult.k = 0 + sc.seekResult.v = nil + k, v := sc.cursor.Next() + if k == nil { + key = -1 + } else { + key, value = int64(btou64(k)), v + } + return +} + +// btou64 converts an 8-byte slice into an uint64. +func btou64(b []byte) uint64 { return binary.BigEndian.Uint64(b) } diff --git a/tsdb/executor.go b/tsdb/executor.go index 78d65c9488..615ca3d6de 100644 --- a/tsdb/executor.go +++ b/tsdb/executor.go @@ -27,39 +27,6 @@ type Executor interface { Execute() <-chan *models.Row } -// Mapper is the interface all Mapper types must implement. -type Mapper interface { - Open() error - SetRemote(m Mapper) - TagSets() []string - Fields() []string - NextChunk() (interface{}, error) - Close() -} - -// StatefulMapper encapsulates a Mapper and some state that the executor needs to -// track for that mapper. -type StatefulMapper struct { - Mapper - bufferedChunk *MapperOutput // Last read chunk. - drained bool -} - -// NextChunk wraps a RawMapper and some state. -func (sm *StatefulMapper) NextChunk() (*MapperOutput, error) { - c, err := sm.Mapper.NextChunk() - if err != nil { - return nil, err - } - chunk, ok := c.(*MapperOutput) - if !ok { - if chunk == interface{}(nil) { - return nil, nil - } - } - return chunk, nil -} - type SelectExecutor struct { stmt *influxql.SelectStatement mappers []*StatefulMapper diff --git a/tsdb/functions.go b/tsdb/functions.go index 35b084f312..e33be8d339 100644 --- a/tsdb/functions.go +++ b/tsdb/functions.go @@ -36,7 +36,7 @@ type reduceFunc func([]interface{}) interface{} // UnmarshalFunc represents a function that can take bytes from a mapper from remote // server and marshal it into an interface the reducer can use -type unmarshalFunc func([]byte) (interface{}, error) +type UnmarshalFunc func([]byte) (interface{}, error) // initializemapFunc takes an aggregate call from the query and returns the mapFunc func initializeMapFunc(c *influxql.Call) (mapFunc, error) { @@ -149,7 +149,7 @@ func initializeReduceFunc(c *influxql.Call) (reduceFunc, error) { } } -func initializeUnmarshaller(c *influxql.Call) (unmarshalFunc, error) { +func InitializeUnmarshaller(c *influxql.Call) (UnmarshalFunc, error) { // if c is nil it's a raw data query if c == nil { return func(b []byte) (interface{}, error) { diff --git a/tsdb/mapper.go b/tsdb/mapper.go index 6baea3b084..f207d07795 100644 --- a/tsdb/mapper.go +++ b/tsdb/mapper.go @@ -2,16 +2,46 @@ package tsdb import ( "container/heap" - "encoding/binary" "encoding/json" "errors" "fmt" "sort" - "strings" "github.com/influxdb/influxdb/influxql" ) +// Mapper is the interface all Mapper types must implement. +type Mapper interface { + Open() error + TagSets() []string + Fields() []string + NextChunk() (interface{}, error) + Close() +} + +// StatefulMapper encapsulates a Mapper and some state that the executor needs to +// track for that mapper. +type StatefulMapper struct { + Mapper + bufferedChunk *MapperOutput // Last read chunk. + drained bool +} + +// NextChunk wraps a RawMapper and some state. +func (sm *StatefulMapper) NextChunk() (*MapperOutput, error) { + c, err := sm.Mapper.NextChunk() + if err != nil { + return nil, err + } + chunk, ok := c.(*MapperOutput) + if !ok { + if chunk == interface{}(nil) { + return nil, nil + } + } + return chunk, nil +} + // MapperValue is a complex type, which can encapsulate data from both raw and aggregate // mappers. This currently allows marshalling and network system to remain simpler. For // aggregate output Time is ignored, and actual Time-Value pairs are contained soley @@ -22,10 +52,10 @@ type MapperValue struct { Tags map[string]string `json:"tags,omitempty"` // Meta tags for results } -// MapperValueAsJSON is the JSON-encoded representation of MapperValue. Because MapperValue is +// MapperValueJSON is the JSON-encoded representation of MapperValue. Because MapperValue is // a complex type, custom JSON encoding is required so that none of the types contained within // a MapperValue are "lost", and so the data are encoded as byte slices where necessary. -type MapperValueAsJSON struct { +type MapperValueJSON struct { Time int64 `json:"time,omitempty"` RawData []byte `json:"rdata,omitempty"` AggData [][]byte `json:"adata,omitempty"` @@ -34,7 +64,7 @@ type MapperValueAsJSON struct { // MarshalJSON returns the JSON-encoded representation of a MapperValue. func (mv *MapperValue) MarshalJSON() ([]byte, error) { - o := &MapperValueAsJSON{ + o := &MapperValueJSON{ Time: mv.Time, AggData: make([][]byte, 0), Tags: mv.Tags, @@ -77,9 +107,9 @@ type MapperOutput struct { cursorKey string // Tagset-based key for the source cursor. Cached for performance reasons. } -// MapperOutputAsJSON is the JSON-encoded representation of MapperOutput. The query data is represented +// MapperOutputJSON is the JSON-encoded representation of MapperOutput. The query data is represented // as a raw JSON message, so decode is delayed, and can proceed in a custom manner. -type MapperOutputAsJSON struct { +type MapperOutputJSON struct { Name string `json:"name,omitempty"` Tags map[string]string `json:"tags,omitempty"` Fields []string `json:"fields,omitempty"` // Field names of returned data. @@ -88,7 +118,7 @@ type MapperOutputAsJSON struct { // MarshalJSON returns the JSON-encoded representation of a MapperOutput. func (mo *MapperOutput) MarshalJSON() ([]byte, error) { - o := &MapperOutputAsJSON{ + o := &MapperOutputJSON{ Name: mo.Name, Tags: mo.Tags, Fields: mo.Fields, @@ -106,359 +136,158 @@ func (mo *MapperOutput) key() string { return mo.cursorKey } -// SelectMapper is for retrieving data for a query, from a given shard. -type SelectMapper struct { - shard *Shard - remote Mapper - stmt *influxql.SelectStatement - rawMode bool - chunkSize int - tx Tx // Read transaction for this shard. - queryTMin int64 // Minimum time of the query. - queryTMax int64 // Maximum time of the query. - whereFields []string // field names that occur in the where clause - selectFields []string // field names that occur in the select clause - selectTags []string // tag keys that occur in the select clause - cursors []*tagSetCursor // Cursors per tag sets. - currCursorIndex int // Current tagset cursor being drained. +// RawMapper runs the map phase for non-aggregate, raw SELECT queries. +type RawMapper struct { + shard *Shard + stmt *influxql.SelectStatement + qmin, qmax int64 // query time range - // The following attributes are only used when mappers are for aggregate queries. + tx Tx + cursors []*TagSetCursor + cursorIndex int - queryTMinWindow int64 // Minimum time of the query floored to start of interval. - intervalSize int64 // Size of each interval. - numIntervals int // Maximum number of intervals to return. - currInterval int // Current interval for which data is being fetched. - mapFuncs []mapFunc // The mapping functions. - mapUnmarshallers []unmarshalFunc // Mapping-specific unmarshal functions. - fieldNames []string // the field name being read for mapping. + selectFields []string + selectTags []string + whereFields []string + + ChunkSize int } -// NewSelectMapper returns a mapper for the given shard, which will return data for the SELECT statement. -func NewSelectMapper(shard *Shard, stmt *influxql.SelectStatement, chunkSize int) *SelectMapper { - return &SelectMapper{ - shard: shard, - stmt: stmt, - chunkSize: chunkSize, - cursors: make([]*tagSetCursor, 0), +// NewRawMapper returns a new instance of RawMapper. +func NewRawMapper(sh *Shard, stmt *influxql.SelectStatement) *RawMapper { + return &RawMapper{ + shard: sh, + stmt: stmt, } } -func (lm *SelectMapper) timeDirection() Direction { - if len(lm.stmt.SortFields) > 0 { - if lm.stmt.SortFields[0].Ascending { - return Forward - } else { - return Reverse - } - } - return Forward -} - -// Open opens the Mapper for a SELECT Statement -func (lm *SelectMapper) Open() error { - // If in aggregate mode, initialize the map-and-reduce functions. Both local and - // remote mappers need this. - if !lm.rawMode { - if err := lm.initializeMapFunctions(); err != nil { - return err - } - } - - // If this mapper is actually responsible for accessing remote shard, initialize - // that and return. - if lm.remote != nil { - return lm.remote.Open() - } - - // This can happen when a shard has been assigned to this node but we have not - // written to it so it may not exist yet. - if lm.shard == nil { +// Open opens and initializes the mapper. +func (m *RawMapper) Open() error { + // Ignore if node has the shard but hasn't written to it yet. + if m.shard == nil { return nil } - // Get a read-only transaction. - tx, err := lm.shard.engine.Begin(false) + // Rewrite statement. + stmt, err := m.shard.index.RewriteSelectStatement(m.stmt) if err != nil { return err } - lm.tx = tx + m.stmt = stmt - if err := func() error { - stmt, err := lm.rewriteSelectStatement(lm.stmt) + // Set all time-related parameters on the mapper. + m.qmin, m.qmax = influxql.TimeRangeAsEpochNano(m.stmt.Condition) + + // Get a read-only transaction. + tx, err := m.shard.engine.Begin(false) + if err != nil { + return err + } + m.tx = tx + + selectFields := newStringSet() + selectTags := newStringSet() + whereFields := newStringSet() + + // Open cursors for each measurement. + for _, src := range m.stmt.Sources { + // Retrieve measurement index reference. Ignore if not exists. + mm := m.shard.index.Measurement(src.(*influxql.Measurement).Name) + if mm == nil { + continue + } + + // Open cursors for measurement. + info, err := m.openMeasurement(mm) if err != nil { return err } - lm.stmt = stmt - lm.rawMode = (stmt.IsRawQuery && !stmt.HasDistinct()) || stmt.IsSimpleDerivative() - // Set all time-related parameters on the mapper. - lm.queryTMin, lm.queryTMax = influxql.TimeRangeAsEpochNano(lm.stmt.Condition) + // Append fields & tags. + selectFields.add(info.SelectFields...) + selectTags.add(info.SelectTags...) + whereFields.add(info.WhereFields...) + } - if !lm.rawMode { - // For GROUP BY time queries, limit the number of data points returned by the limit and offset - d, err := lm.stmt.GroupByInterval() - if err != nil { - return err - } - lm.intervalSize = d.Nanoseconds() - if lm.queryTMin == 0 || lm.intervalSize == 0 { - lm.numIntervals = 1 - lm.intervalSize = lm.queryTMax - lm.queryTMin - } else { - intervalTop := lm.queryTMax/lm.intervalSize*lm.intervalSize + lm.intervalSize - intervalBottom := lm.queryTMin / lm.intervalSize * lm.intervalSize - lm.numIntervals = int((intervalTop - intervalBottom) / lm.intervalSize) - } + m.selectFields = selectFields.list() + m.selectTags = selectTags.list() + m.whereFields = whereFields.list() - if lm.stmt.Limit > 0 || lm.stmt.Offset > 0 { - // ensure that the offset isn't higher than the number of points we'd get - if lm.stmt.Offset > lm.numIntervals { - return nil - } - - // Take the lesser of either the pre computed number of GROUP BY buckets that - // will be in the result or the limit passed in by the user - if lm.stmt.Limit < lm.numIntervals { - lm.numIntervals = lm.stmt.Limit - } - } - - // If we are exceeding our MaxGroupByPoints error out - if lm.numIntervals > MaxGroupByPoints { - return errors.New("too many points in the group by interval. maybe you forgot to specify a where time clause?") - } - - // Ensure that the start time for the results is on the start of the window. - lm.queryTMinWindow = lm.queryTMin - if lm.intervalSize > 0 && lm.numIntervals > 1 { - lm.queryTMinWindow = lm.queryTMinWindow / lm.intervalSize * lm.intervalSize - } - } - - selectFields := newStringSet() - selectTags := newStringSet() - whereFields := newStringSet() - - // Create the TagSet cursors for the Mapper. - for _, src := range lm.stmt.Sources { - mm, ok := src.(*influxql.Measurement) - if !ok { - return fmt.Errorf("invalid source type: %#v", src) - } - - m := lm.shard.index.Measurement(mm.Name) - if m == nil { - // This shard have never received data for the measurement. No Mapper - // required. - return nil - } - - // Validate that ANY GROUP BY is not a field for the measurement. - if err := m.ValidateGroupBy(lm.stmt); err != nil { - return err - } - - // Create tagset cursors and determine various field types within SELECT statement. - tsf, err := createTagSetsAndFields(m, lm.stmt) - if err != nil { - return err - } - tagSets := tsf.tagSets - selectFields.add(tsf.selectFields...) - selectTags.add(tsf.selectTags...) - whereFields.add(tsf.whereFields...) - - // If we only have tags in our select clause we just return - if len(selectFields) == 0 && len(selectTags) > 0 { - return fmt.Errorf("statement must have at least one field in select clause") - } - - // Validate that any GROUP BY is not on a field - if err := m.ValidateGroupBy(lm.stmt); err != nil { - return err - } - - // SLIMIT and SOFFSET the unique series - if lm.stmt.SLimit > 0 || lm.stmt.SOffset > 0 { - if lm.stmt.SOffset > len(tagSets) { - tagSets = nil - } else { - if lm.stmt.SOffset+lm.stmt.SLimit > len(tagSets) { - lm.stmt.SLimit = len(tagSets) - lm.stmt.SOffset - } - - tagSets = tagSets[lm.stmt.SOffset : lm.stmt.SOffset+lm.stmt.SLimit] - } - } - - // For aggregate functions, we iterate the cursors in forward order but return the - // time bucket results in reverse order. This simplifies the aggregate code in that - // they do not need to hand forward and revers semantics. For raw queries, we do need - // iterate in reverse order if using order by time desc. - direction := Forward - if lm.rawMode { - direction = lm.timeDirection() - } - // Create all cursors for reading the data from this shard. - for _, t := range tagSets { - cursors := []*seriesCursor{} - - for i, key := range t.SeriesKeys { - c := lm.tx.Cursor(key, direction) - if c == nil { - // No data exists for this key. - continue - } - seriesTags := lm.shard.index.TagsForSeries(key) - cm := newSeriesCursor(c, t.Filters[i], seriesTags) - cursors = append(cursors, cm) - } - - tsc := newTagSetCursor(m.Name, t.Tags, cursors, lm.shard.FieldCodec(m.Name)) - if lm.rawMode { - tsc.pointHeap = newPointHeap() - //Prime the buffers. - for i := 0; i < len(tsc.cursors); i++ { - var k int64 - var v []byte - if direction.Forward() { - k, v = tsc.cursors[i].SeekTo(lm.queryTMin) - } else { - k, v = tsc.cursors[i].SeekTo(lm.queryTMax) - } - - if k == -1 { - k, v = tsc.cursors[i].Next() - } - - if k == -1 { - continue - } - p := &pointHeapItem{ - timestamp: k, - value: v, - cursor: tsc.cursors[i], - } - heap.Push(tsc.pointHeap, p) - } - } - lm.cursors = append(lm.cursors, tsc) - } - sort.Sort(tagSetCursors(lm.cursors)) - } - - lm.selectFields = selectFields.list() - lm.selectTags = selectTags.list() - lm.whereFields = whereFields.list() - - // If the query does not aggregate, then at least 1 SELECT field should be present. - if lm.rawMode && len(lm.selectFields) == 0 { - // None of the SELECT fields exist in this data. Wipe out all tagset cursors. - lm.cursors = nil - } - - return nil - }(); err != nil { - lm.tx.Rollback() - return err + // Remove cursors if no SELECT fields are present. + if len(m.selectFields) == 0 { + m.cursors = nil } return nil } -func (lm *SelectMapper) SetRemote(m Mapper) { lm.remote = m } +func (m *RawMapper) openMeasurement(mm *Measurement) (SelectInfo, error) { + // Validate and return selection info. + info, err := mm.ValidateSelectStatement(m.stmt) + if err != nil { + return info, err + } -func (lm *SelectMapper) NextChunk() (interface{}, error) { - // If set, use remote mapper. - if lm.remote != nil { - b, err := lm.remote.NextChunk() - if err != nil { - return nil, err - } else if b == nil { - return nil, nil - } + // Create all cursors for reading the data from this shard. + direction := Direction(m.stmt.TimeAscending()) + for _, t := range info.TagSets { + cursors := []*seriesCursor{} - moj := &MapperOutputAsJSON{} - if err := json.Unmarshal(b.([]byte), moj); err != nil { - return nil, err - } - mvj := []*MapperValueAsJSON{} - if err := json.Unmarshal(moj.Values, &mvj); err != nil { - return nil, err - } - - // Prep the non-JSON version of Mapper output. - mo := &MapperOutput{ - Name: moj.Name, - Tags: moj.Tags, - Fields: moj.Fields, - } - - if len(mvj) == 1 && len(mvj[0].AggData) > 0 { - // The MapperValue is carrying aggregate data, so run it through the - // custom unmarshallers for the map functions through which the data - // was mapped. - aggValues := []interface{}{} - for i, b := range mvj[0].AggData { - v, err := lm.mapUnmarshallers[i](b) - if err != nil { - return nil, err - } - aggValues = append(aggValues, v) + for i, key := range t.SeriesKeys { + c := m.tx.Cursor(key, direction) + if c == nil { + continue } - mv := &MapperValue{ - Value: aggValues, - Tags: mvj[0].Tags, - } - mo.Values = []*MapperValue{mv} + + seriesTags := m.shard.index.TagsForSeries(key) + cm := newSeriesCursor(c, t.Filters[i], seriesTags) + cursors = append(cursors, cm) + } + + tsc := NewTagSetCursor(mm.Name, t.Tags, cursors, m.shard.FieldCodec(mm.Name)) + if direction.Forward() { + tsc.SeekTo(m.qmin) } else { - // Must be raw data instead. - for _, v := range mvj { - var rawValue interface{} - err := json.Unmarshal(v.RawData, &rawValue) - if err != nil { - return nil, err - } - mv := &MapperValue{ - Time: v.Time, - Value: rawValue, - Tags: v.Tags, - } - if mo.Values == nil { - mo.Values = []*MapperValue{mv} - } else { - mo.Values = append(mo.Values, mv) - } - } + tsc.SeekTo(m.qmax) } - - return mo, nil + m.cursors = append(m.cursors, tsc) } - // Remote mapper not set so get values from local shard. - if lm.rawMode { - return lm.nextChunkRaw() - } + sort.Sort(TagSetCursors(m.cursors)) - return lm.nextChunkAgg() + return info, nil } -// nextChunkRaw returns the next chunk of data. Data comes in the same order as the -// tags return by TagSets. A chunk never contains data for more than 1 tagset. +// Close closes the mapper. +func (m *RawMapper) Close() { + if m != nil && m.tx != nil { + m.tx.Rollback() + } +} + +// TagSets returns the list of tag sets for which this mapper has data. +func (m *RawMapper) TagSets() []string { return TagSetCursors(m.cursors).Keys() } + +// Fields returns all SELECT fields. +func (m *RawMapper) Fields() []string { return append(m.selectFields, m.selectTags...) } + +// NextChunk returns the next chunk of data. +// Data is ordered the same as TagSets. Each chunk contains one tag set. // If there is no more data for any tagset, nil will be returned. -func (lm *SelectMapper) nextChunkRaw() (interface{}, error) { +func (m *RawMapper) NextChunk() (interface{}, error) { var output *MapperOutput for { - if lm.currCursorIndex == len(lm.cursors) { - // All tagset cursors processed. NextChunk'ing complete. + // All tagset cursors processed. NextChunk'ing complete. + if m.cursorIndex == len(m.cursors) { return nil, nil } - cursor := lm.cursors[lm.currCursorIndex] - k, v := cursor.Next(lm.queryTMin, lm.queryTMax, lm.selectFields, lm.whereFields) + cursor := m.cursors[m.cursorIndex] + + k, v := cursor.Next(m.qmin, m.qmax, m.selectFields, m.whereFields) if v == nil { // Tagset cursor is empty, move to next one. - lm.currCursorIndex++ + m.cursorIndex++ if output != nil { // There is data, so return it and continue when next called. return output, nil @@ -467,158 +296,202 @@ func (lm *SelectMapper) nextChunkRaw() (interface{}, error) { continue } } + if output == nil { output = &MapperOutput{ Name: cursor.measurement, Tags: cursor.tags, - Fields: lm.selectFields, + Fields: m.selectFields, cursorKey: cursor.key(), } } - value := &MapperValue{Time: k, Value: v, Tags: cursor.Tags()} - output.Values = append(output.Values, value) - if len(output.Values) == lm.chunkSize { + + output.Values = append(output.Values, &MapperValue{ + Time: k, + Value: v, + Tags: cursor.Tags(), + }) + + if len(output.Values) == m.ChunkSize { return output, nil } } } -// nextChunkAgg returns the next chunk of data, which is the next interval of data -// for the current tagset. Tagsets are always processed in the same order as that -// returned by AvailTagsSets(). When there is no more data for any tagset nil -// is returned. -func (lm *SelectMapper) nextChunkAgg() (interface{}, error) { - var output *MapperOutput - for { - if lm.currCursorIndex == len(lm.cursors) { - // All tagset cursors processed. NextChunk'ing complete. - return nil, nil - } - tsc := lm.cursors[lm.currCursorIndex] - tmin, tmax := lm.nextInterval() +// AggregateMapper runs the map phase for aggregate SELECT queries. +type AggregateMapper struct { + shard *Shard + stmt *influxql.SelectStatement + qmin, qmax int64 // query time range - if tmin < 0 { - // All intervals complete for this tagset. Move to the next tagset. - lm.currInterval = 0 - lm.currCursorIndex++ + tx Tx + cursors []*TagSetCursor + cursorIndex int + + interval int // Current interval for which data is being fetched. + intervalN int // Maximum number of intervals to return. + intervalSize int64 // Size of each interval. + qminWindow int64 // Minimum time of the query floored to start of interval. + + mapFuncs []mapFunc // The mapping functions. + fieldNames []string // the field name being read for mapping. + + selectFields []string + selectTags []string + whereFields []string +} + +// NewAggregateMapper returns a new instance of AggregateMapper. +func NewAggregateMapper(sh *Shard, stmt *influxql.SelectStatement) *AggregateMapper { + return &AggregateMapper{ + shard: sh, + stmt: stmt, + } +} + +// Open opens and initializes the mapper. +func (m *AggregateMapper) Open() error { + // Ignore if node has the shard but hasn't written to it yet. + if m.shard == nil { + return nil + } + + // Rewrite statement. + stmt, err := m.shard.index.RewriteSelectStatement(m.stmt) + if err != nil { + return err + } + m.stmt = stmt + + // Set all time-related parameters on the mapper. + m.qmin, m.qmax = influxql.TimeRangeAsEpochNano(m.stmt.Condition) + + if err := m.initializeMapFunctions(); err != nil { + return err + } + + // For GROUP BY time queries, limit the number of data points returned by the limit and offset + d, err := m.stmt.GroupByInterval() + if err != nil { + return err + } + + m.intervalSize = d.Nanoseconds() + if m.qmin == 0 || m.intervalSize == 0 { + m.intervalN = 1 + m.intervalSize = m.qmax - m.qmin + } else { + intervalTop := m.qmax/m.intervalSize*m.intervalSize + m.intervalSize + intervalBottom := m.qmin / m.intervalSize * m.intervalSize + m.intervalN = int((intervalTop - intervalBottom) / m.intervalSize) + } + + if m.stmt.Limit > 0 || m.stmt.Offset > 0 { + // ensure that the offset isn't higher than the number of points we'd get + if m.stmt.Offset > m.intervalN { + return nil + } + + // Take the lesser of either the pre computed number of GROUP BY buckets that + // will be in the result or the limit passed in by the user + if m.stmt.Limit < m.intervalN { + m.intervalN = m.stmt.Limit + } + } + + // If we are exceeding our MaxGroupByPoints error out + if m.intervalN > MaxGroupByPoints { + return errors.New("too many points in the group by interval. maybe you forgot to specify a where time clause?") + } + + // Ensure that the start time for the results is on the start of the window. + m.qminWindow = m.qmin + if m.intervalSize > 0 && m.intervalN > 1 { + m.qminWindow = m.qminWindow / m.intervalSize * m.intervalSize + } + + // Get a read-only transaction. + tx, err := m.shard.engine.Begin(false) + if err != nil { + return err + } + m.tx = tx + + selectFields := newStringSet() + selectTags := newStringSet() + whereFields := newStringSet() + + // Open cursors for each measurement. + for _, src := range m.stmt.Sources { + // Retrieve measurement index reference. Ignore if not exists. + mm := m.shard.index.Measurement(src.(*influxql.Measurement).Name) + if mm == nil { continue } - // Prep the return data for this tagset. This will hold data for a single interval - // for a single tagset. - if output == nil { - output = &MapperOutput{ - Name: tsc.measurement, - Tags: tsc.tags, - Fields: lm.selectFields, - Values: make([]*MapperValue, 1), - cursorKey: tsc.key(), - } - // Aggregate values only use the first entry in the Values field. Set the time - // to the start of the interval. - output.Values[0] = &MapperValue{ - Time: tmin, - Value: make([]interface{}, 0)} + // Open cursors for measurement. + info, err := m.openMeasurement(mm) + if err != nil { + return err } - // Always clamp tmin and tmax. This can happen as bucket-times are bucketed to the nearest - // interval. This is necessary to grab the "partial" buckets at the beginning and end of the time range - qmin := tmin - if qmin < lm.queryTMin { - qmin = lm.queryTMin - } - qmax := tmax - if qmax > lm.queryTMax { - // Need to offset by one nanosecond for the logic to work properly in the tagset cursor Next - qmax = lm.queryTMax + 1 - } - - tsc.pointHeap = newPointHeap() - for i := range lm.mapFuncs { - // Prime the tagset cursor for the start of the interval. This is not ideal, as - // it should really calculate the values all in 1 pass, but that would require - // changes to the mapper functions, which can come later. - // Prime the buffers. - for i := 0; i < len(tsc.cursors); i++ { - k, v := tsc.cursors[i].SeekTo(qmin) - if k == -1 || k > tmax { - continue - } - p := &pointHeapItem{ - timestamp: k, - value: v, - cursor: tsc.cursors[i], - } - heap.Push(tsc.pointHeap, p) - } - // Wrap the tagset cursor so it implements the mapping functions interface. - nextf := func() (_ int64, value interface{}) { - k, v := tsc.Next(qmin, qmax, []string{lm.fieldNames[i]}, lm.whereFields) - return k, v - } - - tagf := func() map[string]string { - return tsc.Tags() - } - - tminf := func() int64 { - if len(lm.stmt.Dimensions) == 0 { - return -1 - } - if !lm.stmt.HasTimeFieldSpecified() { - return tmin - } - return -1 - } - - tagSetCursor := &aggTagSetCursor{ - nextFunc: nextf, - tagsFunc: tagf, - tMinFunc: tminf, - } - - // Execute the map function which walks the entire interval, and aggregates - // the result. - values := output.Values[0].Value.([]interface{}) - output.Values[0].Value = append(values, lm.mapFuncs[i](tagSetCursor)) - } - return output, nil + // Append fields & tags. + selectFields.add(info.SelectFields...) + selectTags.add(info.SelectTags...) + whereFields.add(info.WhereFields...) } + + m.selectFields = selectFields.list() + m.selectTags = selectTags.list() + m.whereFields = whereFields.list() + + return nil } -// nextInterval returns the next interval for which to return data. If start is less than 0 -// there are no more intervals. -func (lm *SelectMapper) nextInterval() (start, end int64) { - t := lm.queryTMinWindow + int64(lm.currInterval+lm.stmt.Offset)*lm.intervalSize - - // Onto next interval. - lm.currInterval++ - if t > lm.queryTMax || lm.currInterval > lm.numIntervals { - start, end = -1, 1 - } else { - start, end = t, t+lm.intervalSize +func (m *AggregateMapper) openMeasurement(mm *Measurement) (SelectInfo, error) { + // Validate and return selection info. + info, err := mm.ValidateSelectStatement(m.stmt) + if err != nil { + return info, err } - return + + // Create all cursors for reading the data from this shard. + for _, t := range info.TagSets { + cursors := []*seriesCursor{} + + for i, key := range t.SeriesKeys { + c := m.tx.Cursor(key, Forward) + if c == nil { + continue + } + + seriesTags := m.shard.index.TagsForSeries(key) + cursors = append(cursors, newSeriesCursor(c, t.Filters[i], seriesTags)) + } + + tsc := NewTagSetCursor(mm.Name, t.Tags, cursors, m.shard.FieldCodec(mm.Name)) + tsc.SeekTo(m.qmin) + m.cursors = append(m.cursors, tsc) + } + + sort.Sort(TagSetCursors(m.cursors)) + + return info, nil } -// initializeMapFunctions initialize the mapping functions for the mapper. This only applies -// to aggregate queries -func (lm *SelectMapper) initializeMapFunctions() error { - var err error +// initializeMapFunctions initialize the mapping functions for the mapper. +func (m *AggregateMapper) initializeMapFunctions() error { // Set up each mapping function for this statement. - aggregates := lm.stmt.FunctionCalls() - lm.mapFuncs = make([]mapFunc, len(aggregates)) - lm.mapUnmarshallers = make([]unmarshalFunc, len(aggregates)) - lm.fieldNames = make([]string, len(lm.mapFuncs)) + aggregates := m.stmt.FunctionCalls() + m.mapFuncs = make([]mapFunc, len(aggregates)) + m.fieldNames = make([]string, len(m.mapFuncs)) + for i, c := range aggregates { - lm.mapFuncs[i], err = initializeMapFunc(c) - if err != nil { - return err - } - lm.mapUnmarshallers[i], err = initializeUnmarshaller(c) + mfn, err := initializeMapFunc(c) if err != nil { return err } + m.mapFuncs[i] = mfn // Check for calls like `derivative(lmean(value), 1d)` var nested *influxql.Call = c @@ -627,12 +500,12 @@ func (lm *SelectMapper) initializeMapFunctions() error { } switch lit := nested.Args[0].(type) { case *influxql.VarRef: - lm.fieldNames[i] = lit.Val + m.fieldNames[i] = lit.Val case *influxql.Distinct: if c.Name != "count" { return fmt.Errorf("aggregate call didn't contain a field %s", c.String()) } - lm.fieldNames[i] = lit.Val + m.fieldNames[i] = lit.Val default: return fmt.Errorf("aggregate call didn't contain a field %s", c.String()) } @@ -641,504 +514,150 @@ func (lm *SelectMapper) initializeMapFunctions() error { return nil } -// rewriteSelectStatement performs any necessary query re-writing. -func (lm *SelectMapper) rewriteSelectStatement(stmt *influxql.SelectStatement) (*influxql.SelectStatement, error) { - // Expand regex expressions in the FROM clause. - sources, err := expandSources(stmt.Sources, lm.shard.index) - if err != nil { - return nil, err - } - stmt.Sources = sources - - // Expand wildcards in the fields or GROUP BY. - stmt, err = lm.expandWildcards(stmt) - if err != nil { - return nil, err - } - - stmt.RewriteDistinct() - - return stmt, nil -} - -// expandWildcards returns a new SelectStatement with wildcards expanded -// If only a `SELECT *` is present, without a `GROUP BY *`, both tags and fields expand in the SELECT -// If a `SELECT *` and a `GROUP BY *` are both present, then only fiels are expanded in the `SELECT` and only -// tags are expanded in the `GROUP BY` -func (lm *SelectMapper) expandWildcards(stmt *influxql.SelectStatement) (*influxql.SelectStatement, error) { - // If there are no wildcards in the statement, return it as-is. - if !stmt.HasWildcard() { - return stmt, nil - } - // Use sets to avoid duplicate field names. - fieldSet := map[string]struct{}{} - dimensionSet := map[string]struct{}{} - var fields influxql.Fields - var dimensions influxql.Dimensions - - // keep track of where the wildcards are in the select statement - hasFieldWildcard := stmt.HasFieldWildcard() - hasDimensionWildcard := stmt.HasDimensionWildcard() - - // Iterate measurements in the FROM clause getting the fields & dimensions for each. - for _, src := range stmt.Sources { - if m, ok := src.(*influxql.Measurement); ok { - // Lookup the measurement in the database. - mm := lm.shard.index.Measurement(m.Name) - if mm == nil { - // This shard have never received data for the measurement. No Mapper - // required. - return stmt, nil - } - // Get the fields for this measurement. - for _, name := range mm.FieldNames() { - if _, ok := fieldSet[name]; ok { - continue - } - fieldSet[name] = struct{}{} - fields = append(fields, &influxql.Field{Expr: &influxql.VarRef{Val: name}}) - } - - // Add tags to fields if a field wildcard was provided and a dimension wildcard was not. - if hasFieldWildcard && !hasDimensionWildcard { - for _, t := range mm.TagKeys() { - if _, ok := fieldSet[t]; ok { - continue - } - fieldSet[t] = struct{}{} - fields = append(fields, &influxql.Field{Expr: &influxql.VarRef{Val: t}}) - } - } - - // Get the dimensions for this measurement. - if hasDimensionWildcard { - for _, t := range mm.TagKeys() { - if _, ok := dimensionSet[t]; ok { - continue - } - dimensionSet[t] = struct{}{} - dimensions = append(dimensions, &influxql.Dimension{Expr: &influxql.VarRef{Val: t}}) - } - } - } - } - - // Return a new SelectStatement with the wild cards rewritten. - return stmt.RewriteWildcards(fields, dimensions), nil -} - -// TagSets returns the list of TagSets for which this mapper has data. -func (lm *SelectMapper) TagSets() []string { - if lm.remote != nil { - return lm.remote.TagSets() - } - return tagSetCursors(lm.cursors).Keys() -} - -// Fields returns any SELECT fields. If this Mapper is not processing a SELECT query -// then an empty slice is returned. -func (lm *SelectMapper) Fields() []string { - if lm.remote != nil { - return lm.remote.Fields() - } - return append(lm.selectFields, lm.selectTags...) -} - // Close closes the mapper. -func (lm *SelectMapper) Close() { - if lm.remote != nil { - lm.remote.Close() - return - } - if lm != nil && lm.tx != nil { - _ = lm.tx.Rollback() +func (m *AggregateMapper) Close() { + if m != nil && m.tx != nil { + m.tx.Rollback() } + return } -// aggTagSetCursor wraps a standard tagSetCursor, such that the values it emits are aggregated -// by intervals. -type aggTagSetCursor struct { - nextFunc func() (time int64, value interface{}) - tagsFunc func() map[string]string - tMinFunc func() int64 -} +// TagSets returns the list of tag sets for which this mapper has data. +func (m *AggregateMapper) TagSets() []string { return TagSetCursors(m.cursors).Keys() } -// Next returns the next value for the aggTagSetCursor. It implements the interface expected -// by the mapping functions. -func (a *aggTagSetCursor) Next() (time int64, value interface{}) { - return a.nextFunc() -} +// Fields returns all SELECT fields. +func (m *AggregateMapper) Fields() []string { return append(m.selectFields, m.selectTags...) } -// Tags returns the current tags for the cursor -func (a *aggTagSetCursor) Tags() map[string]string { - return a.tagsFunc() -} - -// TMin returns the current floor time for the bucket being worked on -func (a *aggTagSetCursor) TMin() int64 { - return a.tMinFunc() -} - -type pointHeapItem struct { - timestamp int64 - value []byte - cursor *seriesCursor // cursor whence pointHeapItem came -} - -type pointHeap []*pointHeapItem - -func newPointHeap() *pointHeap { - q := make(pointHeap, 0) - heap.Init(&q) - return &q -} - -func (pq pointHeap) Len() int { return len(pq) } - -func (pq pointHeap) Less(i, j int) bool { - // We want a min-heap (points in chronological order), so use less than. - return pq[i].timestamp < pq[j].timestamp -} - -func (pq pointHeap) Swap(i, j int) { pq[i], pq[j] = pq[j], pq[i] } - -func (pq *pointHeap) Push(x interface{}) { - item := x.(*pointHeapItem) - *pq = append(*pq, item) -} - -func (pq *pointHeap) Pop() interface{} { - old := *pq - n := len(old) - item := old[n-1] - *pq = old[0 : n-1] - return item -} - -// tagSetCursor is virtual cursor that iterates over mutiple series cursors, as though it were -// a single series. -type tagSetCursor struct { - measurement string // Measurement name - tags map[string]string // Tag key-value pairs - cursors []*seriesCursor // Underlying series cursors. - decoder *FieldCodec // decoder for the raw data bytes - currentTags map[string]string // the current tags for the underlying series cursor in play - - // pointHeap is a min-heap, ordered by timestamp, that contains the next - // point from each seriesCursor. Queries sometimes pull points from - // thousands of series. This makes it reasonably efficient to find the - // point with the next lowest timestamp among the thousands of series that - // the query is pulling points from. - // Performance profiling shows that this lookahead needs to be part - // of the tagSetCursor type and not part of the the cursors type. - pointHeap *pointHeap - - // Memomize the cursor's tagset-based key. Profiling shows that calculating this - // is significant CPU cost, and it only needs to be done once. - memokey string -} - -// tagSetCursors represents a sortable slice of tagSetCursors. -type tagSetCursors []*tagSetCursor - -func (a tagSetCursors) Len() int { return len(a) } -func (a tagSetCursors) Less(i, j int) bool { return a[i].key() < a[j].key() } -func (a tagSetCursors) Swap(i, j int) { a[i], a[j] = a[j], a[i] } - -func (a tagSetCursors) Keys() []string { - keys := []string{} - for i := range a { - keys = append(keys, a[i].key()) - } - sort.Strings(keys) - return keys -} - -// newTagSetCursor returns a tagSetCursor -func newTagSetCursor(m string, t map[string]string, c []*seriesCursor, d *FieldCodec) *tagSetCursor { - tsc := &tagSetCursor{ - measurement: m, - tags: t, - cursors: c, - decoder: d, - pointHeap: newPointHeap(), - } - - return tsc -} - -func (tsc *tagSetCursor) key() string { - if tsc.memokey == "" { - tsc.memokey = formMeasurementTagSetKey(tsc.measurement, tsc.tags) - } - return tsc.memokey -} - -// Next returns the next matching series-key, timestamp byte slice and meta tags for the tagset. Filtering -// is enforced on the values. If there is no matching value, then a nil result is returned. -func (tsc *tagSetCursor) Next(tmin, tmax int64, selectFields, whereFields []string) (int64, interface{}) { +// NextChunk returns the next interval of data. +// Tagsets are always processed in the same order as AvailTagsSets(). +// When there is no more data for any tagset nil is returned. +func (m *AggregateMapper) NextChunk() (interface{}, error) { + var tmin, tmax int64 for { - // If we're out of points, we're done. - if tsc.pointHeap.Len() == 0 { - return -1, nil + // All tagset cursors processed. NextChunk'ing complete. + if m.cursorIndex == len(m.cursors) { + return nil, nil } - // Grab the next point with the lowest timestamp. - p := heap.Pop(tsc.pointHeap).(*pointHeapItem) - - // We're done if the point is outside the query's time range [tmin:tmax). - if p.timestamp != tmin && (p.timestamp < tmin || p.timestamp >= tmax) { - return -1, nil + // All intervals complete for this tagset. Move to the next tagset. + tmin, tmax = m.nextInterval() + if tmin < 0 { + m.interval = 0 + m.cursorIndex++ + continue } + break + } - // Decode the raw point. - value := tsc.decodeRawPoint(p, selectFields, whereFields) - timestamp := p.timestamp + // Prep the return data for this tagset. + // This will hold data for a single interval for a single tagset. + tsc := m.cursors[m.cursorIndex] + output := &MapperOutput{ + Name: tsc.measurement, + Tags: tsc.tags, + Fields: m.selectFields, + Values: make([]*MapperValue, 1), + cursorKey: tsc.key(), + } - // Keep track of the current tags for the series cursor so we can - // respond with them if asked - tsc.currentTags = p.cursor.tags + // Aggregate values only use the first entry in the Values field. + // Set the time to the start of the interval. + output.Values[0] = &MapperValue{ + Time: tmin, + Value: make([]interface{}, 0), + } - // Advance the cursor - nextKey, nextVal := p.cursor.Next() - if nextKey != -1 { - *p = pointHeapItem{ - timestamp: nextKey, - value: nextVal, - cursor: p.cursor, + // Always clamp tmin and tmax. This can happen as bucket-times are bucketed to the nearest + // interval. This is necessary to grab the "partial" buckets at the beginning and end of the time range + qmin, qmax := tmin, tmax + if qmin < m.qmin { + qmin = m.qmin + } + if qmax > m.qmax { + qmax = m.qmax + 1 + } + + tsc.pointHeap = newPointHeap() + for i := range m.mapFuncs { + // Prime the tagset cursor for the start of the interval. This is not ideal, as + // it should really calculate the values all in 1 pass, but that would require + // changes to the mapper functions, which can come later. + // Prime the buffers. + for i := 0; i < len(tsc.cursors); i++ { + k, v := tsc.cursors[i].SeekTo(qmin) + if k == -1 || k > tmax { + continue + } + p := &pointHeapItem{ + timestamp: k, + value: v, + cursor: tsc.cursors[i], } heap.Push(tsc.pointHeap, p) } - // Value didn't match, look for the next one. - if value == nil { - continue - } + // Execute the map function which walks the entire interval, and aggregates the result. + output.Values[0].Value = append( + output.Values[0].Value.([]interface{}), + m.mapFuncs[i](&AggregateTagSetCursor{ + cursor: tsc, + tmin: tmin, + stmt: m.stmt, - return timestamp, value + qmin: qmin, + qmax: qmax, + + selectFields: []string{m.fieldNames[i]}, + whereFields: m.whereFields, + }), + ) } + + return output, nil } -// Tags returns the current tags of the current cursor -// if there is no current currsor, it returns nil -func (tsc *tagSetCursor) Tags() map[string]string { - return tsc.currentTags -} +// nextInterval returns the next interval for which to return data. +// If start is less than 0 there are no more intervals. +func (m *AggregateMapper) nextInterval() (start, end int64) { + t := m.qminWindow + int64(m.interval+m.stmt.Offset)*m.intervalSize -// decodeRawPoint decodes raw point data into field names & values and does WHERE filtering. -func (tsc *tagSetCursor) decodeRawPoint(p *pointHeapItem, selectFields, whereFields []string) interface{} { - if len(selectFields) > 1 { - if fieldsWithNames, err := tsc.decoder.DecodeFieldsWithNames(p.value); err == nil { - // if there's a where clause, make sure we don't need to filter this value - if p.cursor.filter != nil && !matchesWhere(p.cursor.filter, fieldsWithNames) { - return nil - } - - return fieldsWithNames - } - } - - // With only 1 field SELECTed, decoding all fields may be avoidable, which is faster. - value, err := tsc.decoder.DecodeByName(selectFields[0], p.value) - if err != nil { - return nil - } - - // If there's a WHERE clase, see if we need to filter - if p.cursor.filter != nil { - // See if the WHERE is only on this field or on one or more other fields. - // If the latter, we'll have to decode everything - if len(whereFields) == 1 && whereFields[0] == selectFields[0] { - if !matchesWhere(p.cursor.filter, map[string]interface{}{selectFields[0]: value}) { - value = nil - } - } else { // Decode everything - fieldsWithNames, err := tsc.decoder.DecodeFieldsWithNames(p.value) - if err != nil || !matchesWhere(p.cursor.filter, fieldsWithNames) { - value = nil - } - } - } - - return value -} - -// seriesCursor is a cursor that walks a single series. It provides lookahead functionality. -type seriesCursor struct { - cursor Cursor // BoltDB cursor for a series - filter influxql.Expr - tags map[string]string - seekto int64 - seekResult struct { - k int64 - v []byte - } -} - -// newSeriesCursor returns a new instance of a series cursor. -func newSeriesCursor(cur Cursor, filter influxql.Expr, tags map[string]string) *seriesCursor { - return &seriesCursor{ - cursor: cur, - filter: filter, - tags: tags, - seekto: -1, - } -} - -// Seek positions returning the timestamp and value at that key. -func (sc *seriesCursor) SeekTo(key int64) (timestamp int64, value []byte) { - if sc.seekto != -1 && sc.seekto < key && (sc.seekResult.k == -1 || sc.seekResult.k >= key) { - // we've seeked on this cursor. This seek is after that previous cached seek - // and the result it gave was after the key for this seek. - // - // In this case, any seek would just return what we got before, so there's - // no point in reseeking. - return sc.seekResult.k, sc.seekResult.v - } - k, v := sc.cursor.Seek(u64tob(uint64(key))) - if k == nil { - timestamp = -1 + // On to next interval. + m.interval++ + if t > m.qmax || m.interval > m.intervalN { + start, end = -1, 1 } else { - timestamp, value = int64(btou64(k)), v - } - sc.seekto = key - sc.seekResult.k = timestamp - sc.seekResult.v = v - return -} - -// Next returns the next timestamp and value from the cursor. -func (sc *seriesCursor) Next() (key int64, value []byte) { - // calling next on this cursor means that we need to invalidate the seek - sc.seekto = -1 - sc.seekResult.k = 0 - sc.seekResult.v = nil - k, v := sc.cursor.Next() - if k == nil { - key = -1 - } else { - key, value = int64(btou64(k)), v + start, end = t, t+m.intervalSize } return } -type tagSetsAndFields struct { - tagSets []*influxql.TagSet +// AggregateTagSetCursor wraps a standard tagSetCursor, such that the values it emits are aggregated by intervals. +type AggregateTagSetCursor struct { + cursor *TagSetCursor + + tmin int64 + stmt *influxql.SelectStatement + + qmin, qmax int64 selectFields []string - selectTags []string whereFields []string } -// expandSources expands regex sources and removes duplicates. -// NOTE: sources must be normalized (db and rp set) before calling this function. -func expandSources(sources influxql.Sources, di *DatabaseIndex) (influxql.Sources, error) { - // Use a map as a set to prevent duplicates. Two regexes might produce - // duplicates when expanded. - set := map[string]influxql.Source{} - names := []string{} - // Iterate all sources, expanding regexes when they're found. - for _, source := range sources { - switch src := source.(type) { - case *influxql.Measurement: - if src.Regex == nil { - name := src.String() - set[name] = src - names = append(names, name) - continue - } - // Get measurements from the database that match the regex. - measurements := di.measurementsByRegex(src.Regex.Val) - // Add those measurements to the set. - for _, m := range measurements { - m2 := &influxql.Measurement{ - Database: src.Database, - RetentionPolicy: src.RetentionPolicy, - Name: m.Name, - } - name := m2.String() - if _, ok := set[name]; !ok { - set[name] = m2 - names = append(names, name) - } - } - default: - return nil, fmt.Errorf("expandSources: unsuported source type: %T", source) - } - } - // Sort the list of source names. - sort.Strings(names) - // Convert set to a list of Sources. - expanded := make(influxql.Sources, 0, len(set)) - for _, name := range names { - expanded = append(expanded, set[name]) - } - return expanded, nil +// Next returns the next aggregate value for the cursor. +func (a *AggregateTagSetCursor) Next() (time int64, value interface{}) { + return a.cursor.Next(a.qmin, a.qmax, a.selectFields, a.whereFields) } -// createTagSetsAndFields returns the tagsets and various fields given a measurement and -// SELECT statement. -func createTagSetsAndFields(m *Measurement, stmt *influxql.SelectStatement) (*tagSetsAndFields, error) { - _, tagKeys := stmt.Dimensions.Normalize() +// Tags returns the current tags for the cursor +func (a *AggregateTagSetCursor) Tags() map[string]string { return a.cursor.Tags() } - sfs := newStringSet() - sts := newStringSet() - wfs := newStringSet() - - // Validate the fields and tags asked for exist and keep track of which are in the select vs the where - for _, n := range stmt.NamesInSelect() { - if m.HasField(n) { - sfs.add(n) - continue - } - if m.HasTagKey(n) { - sts.add(n) - } +// TMin returns the current floor time for the bucket being worked on +func (a *AggregateTagSetCursor) TMin() int64 { + if len(a.stmt.Dimensions) == 0 { + return -1 } - - for _, n := range stmt.NamesInDimension() { - if m.HasTagKey(n) { - tagKeys = append(tagKeys, n) - } + if !a.stmt.HasTimeFieldSpecified() { + return a.tmin } - - for _, n := range stmt.NamesInWhere() { - if n == "time" { - continue - } - if m.HasField(n) { - wfs.add(n) - continue - } - } - - // Get the sorted unique tag sets for this statement. - tagSets, err := m.TagSets(stmt, tagKeys) - if err != nil { - return nil, err - } - - return &tagSetsAndFields{ - tagSets: tagSets, - selectFields: sfs.list(), - selectTags: sts.list(), - whereFields: wfs.list(), - }, nil + return -1 } - -// matchesFilter returns true if the value matches the where clause -func matchesWhere(f influxql.Expr, fields map[string]interface{}) bool { - if ok, _ := influxql.Eval(f, fields).(bool); !ok { - return false - } - return true -} - -func formMeasurementTagSetKey(name string, tags map[string]string) string { - if len(tags) == 0 { - return name - } - return strings.Join([]string{name, string(MarshalTags(tags))}, "|") -} - -// btou64 converts an 8-byte slice into an uint64. -func btou64(b []byte) uint64 { return binary.BigEndian.Uint64(b) } diff --git a/tsdb/mapper_test.go b/tsdb/mapper_test.go index d3c6bc2297..5b3ac3989a 100644 --- a/tsdb/mapper_test.go +++ b/tsdb/mapper_test.go @@ -416,7 +416,7 @@ func TestShardMapper_WriteAndSingleMapperAggregateQuery(t *testing.T) { for _, tt := range tests { stmt := mustParseSelectStatement(tt.stmt) - mapper := openSelectMapperOrFail(t, shard, stmt) + mapper := openAggregateMapperOrFail(t, shard, stmt) for i := range tt.expected { got := aggIntervalAsJson(t, mapper) @@ -491,7 +491,7 @@ func TestShardMapper_SelectMapperTagSetsFields(t *testing.T) { for _, tt := range tests { stmt := mustParseSelectStatement(tt.stmt) - mapper := openSelectMapperOrFail(t, shard, stmt) + mapper := openAggregateMapperOrFail(t, shard, stmt) fields := mapper.Fields() if !reflect.DeepEqual(fields, tt.expectedFields) { @@ -537,12 +537,12 @@ func mustParseStatement(s string) influxql.Statement { } func openRawMapperOrFail(t *testing.T, shard *tsdb.Shard, stmt *influxql.SelectStatement, chunkSize int) tsdb.Mapper { - mapper := tsdb.NewSelectMapper(shard, stmt, chunkSize) - - if err := mapper.Open(); err != nil { + m := tsdb.NewRawMapper(shard, stmt) + m.ChunkSize = chunkSize + if err := m.Open(); err != nil { t.Fatalf("failed to open raw mapper: %s", err.Error()) } - return mapper + return m } func nextRawChunkAsJson(t *testing.T, mapper tsdb.Mapper) string { @@ -553,16 +553,15 @@ func nextRawChunkAsJson(t *testing.T, mapper tsdb.Mapper) string { return mustMarshalMapperOutput(r) } -func openSelectMapperOrFail(t *testing.T, shard *tsdb.Shard, stmt *influxql.SelectStatement) *tsdb.SelectMapper { - mapper := tsdb.NewSelectMapper(shard, stmt, 0) - - if err := mapper.Open(); err != nil { +func openAggregateMapperOrFail(t *testing.T, shard *tsdb.Shard, stmt *influxql.SelectStatement) *tsdb.AggregateMapper { + m := tsdb.NewAggregateMapper(shard, stmt) + if err := m.Open(); err != nil { t.Fatalf("failed to open aggregate mapper: %s", err.Error()) } - return mapper + return m } -func aggIntervalAsJson(t *testing.T, mapper *tsdb.SelectMapper) string { +func aggIntervalAsJson(t *testing.T, mapper *tsdb.AggregateMapper) string { r, err := mapper.NextChunk() if err != nil { t.Fatalf("failed to get next chunk from aggregate mapper: %s", err.Error()) diff --git a/tsdb/meta.go b/tsdb/meta.go index 8a1fec53d3..1f3a4dd789 100644 --- a/tsdb/meta.go +++ b/tsdb/meta.go @@ -282,6 +282,142 @@ func (db *DatabaseIndex) DropSeries(keys []string) { } } +// RewriteSelectStatement performs any necessary query re-writing. +func (db *DatabaseIndex) RewriteSelectStatement(stmt *influxql.SelectStatement) (*influxql.SelectStatement, error) { + // Expand regex expressions in the FROM clause. + sources, err := db.ExpandSources(stmt.Sources) + if err != nil { + return nil, err + } + stmt.Sources = sources + + // Expand wildcards in the fields or GROUP BY. + stmt, err = db.ExpandWildcards(stmt) + if err != nil { + return nil, err + } + + stmt.RewriteDistinct() + + return stmt, nil +} + +// expandWildcards returns a new SelectStatement with wildcards expanded +// If only a `SELECT *` is present, without a `GROUP BY *`, both tags and fields expand in the SELECT +// If a `SELECT *` and a `GROUP BY *` are both present, then only fiels are expanded in the `SELECT` and only +// tags are expanded in the `GROUP BY` +func (db *DatabaseIndex) ExpandWildcards(stmt *influxql.SelectStatement) (*influxql.SelectStatement, error) { + // If there are no wildcards in the statement, return it as-is. + if !stmt.HasWildcard() { + return stmt, nil + } + // Use sets to avoid duplicate field names. + fieldSet := map[string]struct{}{} + dimensionSet := map[string]struct{}{} + + // keep track of where the wildcards are in the select statement + hasFieldWildcard := stmt.HasFieldWildcard() + hasDimensionWildcard := stmt.HasDimensionWildcard() + + // Iterate measurements in the FROM clause getting the fields & dimensions for each. + var fields influxql.Fields + var dimensions influxql.Dimensions + for _, src := range stmt.Sources { + if m, ok := src.(*influxql.Measurement); ok { + // Lookup the measurement in the database. + mm := db.Measurement(m.Name) + if mm == nil { + // This shard have never received data for the measurement. No Mapper + // required. + return stmt, nil + } + + // Get the fields for this measurement. + for _, name := range mm.FieldNames() { + if _, ok := fieldSet[name]; ok { + continue + } + fieldSet[name] = struct{}{} + fields = append(fields, &influxql.Field{Expr: &influxql.VarRef{Val: name}}) + } + + // Add tags to fields if a field wildcard was provided and a dimension wildcard was not. + if hasFieldWildcard && !hasDimensionWildcard { + for _, t := range mm.TagKeys() { + if _, ok := fieldSet[t]; ok { + continue + } + fieldSet[t] = struct{}{} + fields = append(fields, &influxql.Field{Expr: &influxql.VarRef{Val: t}}) + } + } + + // Get the dimensions for this measurement. + if hasDimensionWildcard { + for _, t := range mm.TagKeys() { + if _, ok := dimensionSet[t]; ok { + continue + } + dimensionSet[t] = struct{}{} + dimensions = append(dimensions, &influxql.Dimension{Expr: &influxql.VarRef{Val: t}}) + } + } + } + } + + // Return a new SelectStatement with the wild cards rewritten. + return stmt.RewriteWildcards(fields, dimensions), nil +} + +// expandSources expands regex sources and removes duplicates. +// NOTE: sources must be normalized (db and rp set) before calling this function. +func (di *DatabaseIndex) ExpandSources(sources influxql.Sources) (influxql.Sources, error) { + // Use a map as a set to prevent duplicates. Two regexes might produce + // duplicates when expanded. + set := map[string]influxql.Source{} + names := []string{} + + // Iterate all sources, expanding regexes when they're found. + for _, source := range sources { + switch src := source.(type) { + case *influxql.Measurement: + if src.Regex == nil { + name := src.String() + set[name] = src + names = append(names, name) + continue + } + // Get measurements from the database that match the regex. + measurements := di.measurementsByRegex(src.Regex.Val) + // Add those measurements to the set. + for _, m := range measurements { + m2 := &influxql.Measurement{ + Database: src.Database, + RetentionPolicy: src.RetentionPolicy, + Name: m.Name, + } + name := m2.String() + if _, ok := set[name]; !ok { + set[name] = m2 + names = append(names, name) + } + } + default: + return nil, fmt.Errorf("expandSources: unsuported source type: %T", source) + } + } + + // Sort the list of source names. + sort.Strings(names) + + // Convert set to a list of Sources. + expanded := make(influxql.Sources, 0, len(set)) + for _, name := range names { + expanded = append(expanded, set[name]) + } + return expanded, nil +} + // Measurement represents a collection of time series in a database. It also contains in memory // structures for indexing tags. Exported functions are goroutine safe while un-exported functions // assume the caller will use the appropriate locks @@ -903,6 +1039,117 @@ func (m *Measurement) uniqueTagValues(expr influxql.Expr) map[string][]string { return out } +// ValidateSelectStatement validates stmt against m. Also returns a list of fields & tagsets. +func (m *Measurement) ValidateSelectStatement(stmt *influxql.SelectStatement) (SelectInfo, error) { + var info SelectInfo + + // Validate that ANY GROUP BY is not a field for the measurement. + if err := m.ValidateGroupBy(stmt); err != nil { + return info, err + } + + // Validate the fields and tags asked for exist and keep track of which are in the select vs the where + info.SelectFields = m.SelectFields(stmt) + info.SelectTags = m.SelectTags(stmt) + info.WhereFields = m.WhereFields(stmt) + + tagSets, err := m.DimensionTagSets(stmt) + if err != nil { + return info, err + } + info.TagSets = tagSets + + // return &tagSetsAndFields{ + // tagSets: tagSets, + // selectFields: sfs.list(), + // selectTags: sts.list(), + // whereFields: wfs.list(), + // }, nil + + // tagSets := tsf.tagSets + // selectFields.add(tsf.selectFields...) + // selectTags.add(tsf.selectTags...) + // whereFields.add(tsf.whereFields...) + + // If we only have tags in our select clause we just return + if len(info.SelectFields) == 0 && len(info.SelectTags) > 0 { + return info, fmt.Errorf("statement must have at least one field in select clause") + } + + // SLIMIT and SOFFSET the unique series + if stmt.SLimit > 0 || stmt.SOffset > 0 { + if stmt.SOffset > len(info.TagSets) { + info.TagSets = nil + } else { + if stmt.SOffset+stmt.SLimit > len(info.TagSets) { + stmt.SLimit = len(info.TagSets) - stmt.SOffset + } + info.TagSets = info.TagSets[stmt.SOffset : stmt.SOffset+stmt.SLimit] + } + } + + return info, nil +} + +// SelectFields returns a list of fields in the SELECT section of stmt. +func (m *Measurement) SelectFields(stmt *influxql.SelectStatement) []string { + set := newStringSet() + for _, name := range stmt.NamesInSelect() { + if m.HasField(name) { + set.add(name) + continue + } + } + return set.list() +} + +// SelectTags returns a list of non-field tags in the SELECT section of stmt. +func (m *Measurement) SelectTags(stmt *influxql.SelectStatement) []string { + set := newStringSet() + for _, name := range stmt.NamesInSelect() { + if !m.HasField(name) && m.HasTagKey(name) { + set.add(name) + } + } + return set.list() +} + +// WhereFields returns a list of non-"time" fields in the WHERE section of stmt. +func (m *Measurement) WhereFields(stmt *influxql.SelectStatement) []string { + set := newStringSet() + for _, name := range stmt.NamesInWhere() { + if name != "time" && m.HasField(name) { + set.add(name) + } + } + return set.list() +} + +// DimensionTagSets returns list of tag sets from the GROUP BY section of stmt. +func (m *Measurement) DimensionTagSets(stmt *influxql.SelectStatement) ([]*influxql.TagSet, error) { + _, tagKeys := stmt.Dimensions.Normalize() + + for _, n := range stmt.NamesInDimension() { + if m.HasTagKey(n) { + tagKeys = append(tagKeys, n) + } + } + + // Get the sorted unique tag sets for this statement. + tagSets, err := m.TagSets(stmt, tagKeys) + if err != nil { + return nil, err + } + return tagSets, nil +} + +type SelectInfo struct { + TagSets []*influxql.TagSet + SelectFields []string + SelectTags []string + WhereFields []string +} + // Measurements represents a list of *Measurement. type Measurements []*Measurement diff --git a/tsdb/show_measurements.go b/tsdb/show_measurements.go index 4aa5e8f002..690c92728a 100644 --- a/tsdb/show_measurements.go +++ b/tsdb/show_measurements.go @@ -120,19 +120,19 @@ func (e *ShowMeasurementsExecutor) close() { // ShowMeasurementsMapper is a mapper for collecting measurement names from a shard. type ShowMeasurementsMapper struct { - remote Mapper - shard *Shard - stmt *influxql.ShowMeasurementsStatement - chunkSize int - state interface{} + remote Mapper + shard *Shard + stmt *influxql.ShowMeasurementsStatement + state interface{} + + ChunkSize int } // NewShowMeasurementsMapper returns a mapper for the given shard, which will return data for the meta statement. -func NewShowMeasurementsMapper(shard *Shard, stmt *influxql.ShowMeasurementsStatement, chunkSize int) *ShowMeasurementsMapper { +func NewShowMeasurementsMapper(shard *Shard, stmt *influxql.ShowMeasurementsStatement) *ShowMeasurementsMapper { return &ShowMeasurementsMapper{ - shard: shard, - stmt: stmt, - chunkSize: chunkSize, + shard: shard, + stmt: stmt, } } @@ -209,13 +209,15 @@ func (m *ShowMeasurementsMapper) NextChunk() (interface{}, error) { // nextChunk implements next chunk logic for a local shard. func (m *ShowMeasurementsMapper) nextChunk() (interface{}, error) { // Allocate array to hold measurement names. - names := make([]string, 0, m.chunkSize) + names := make([]string, 0, m.ChunkSize) + // Get the channel of measurement names from the state. measurementNames := m.state.(chan string) + // Get the next chunk of names. for n := range measurementNames { names = append(names, n) - if len(names) == m.chunkSize { + if len(names) == m.ChunkSize { break } } diff --git a/tsdb/store.go b/tsdb/store.go index b37568dd3a..fbe5b50dd4 100644 --- a/tsdb/store.go +++ b/tsdb/store.go @@ -343,13 +343,22 @@ func (s *Store) WriteToShard(shardID uint64, points []models.Point) error { func (s *Store) CreateMapper(shardID uint64, stmt influxql.Statement, chunkSize int) (Mapper, error) { shard := s.Shard(shardID) - switch st := stmt.(type) { + switch stmt := stmt.(type) { case *influxql.SelectStatement: - return NewSelectMapper(shard, st, chunkSize), nil + if (stmt.IsRawQuery && !stmt.HasDistinct()) || stmt.IsSimpleDerivative() { + m := NewRawMapper(shard, stmt) + m.ChunkSize = chunkSize + return m, nil + } + return NewAggregateMapper(shard, stmt), nil + case *influxql.ShowMeasurementsStatement: - return NewShowMeasurementsMapper(shard, st, chunkSize), nil + m := NewShowMeasurementsMapper(shard, stmt) + m.ChunkSize = chunkSize + return m, nil + default: - return nil, fmt.Errorf("can't create mapper for statement type: %v", st) + return nil, fmt.Errorf("can't create mapper for statement type: %T", stmt) } } From a5269e9cc77e2781c6d94cc7e71955facbfce4f1 Mon Sep 17 00:00:00 2001 From: Ben Johnson Date: Wed, 16 Sep 2015 15:04:37 -0600 Subject: [PATCH 3/8] rename direction to ascending. --- cmd/inspect/main.go | 2 +- tsdb/cursor.go | 53 +++++++++------------- tsdb/cursor_test.go | 90 ++++++++++++++++++------------------- tsdb/engine.go | 9 +--- tsdb/engine/b1/b1.go | 14 +++--- tsdb/engine/b1/b1_test.go | 4 +- tsdb/engine/bz1/bz1.go | 26 +++++------ tsdb/engine/bz1/bz1_test.go | 22 ++++----- tsdb/engine/wal/wal.go | 29 ++++++------ tsdb/engine/wal/wal_test.go | 32 ++++++------- tsdb/mapper.go | 8 ++-- 11 files changed, 136 insertions(+), 153 deletions(-) diff --git a/cmd/inspect/main.go b/cmd/inspect/main.go index 43b233f54f..eaae2d8913 100644 --- a/cmd/inspect/main.go +++ b/cmd/inspect/main.go @@ -78,7 +78,7 @@ func main() { for _, key := range series { fieldSummary := []string{} - cursor := tx.Cursor(key, tsdb.Forward) + cursor := tx.Cursor(key, true) // Series doesn't exist in this shard if cursor == nil { diff --git a/tsdb/cursor.go b/tsdb/cursor.go index 7fb2377084..ac6a4c7421 100644 --- a/tsdb/cursor.go +++ b/tsdb/cursor.go @@ -10,31 +10,11 @@ import ( "github.com/influxdb/influxdb/influxql" ) -// Direction represents a cursor navigation direction. -type Direction bool - -const ( - // Forward indicates that a cursor will move forward over its values. - Forward Direction = true - // Reverse indicates that a cursor will move backwards over its values. - Reverse Direction = false -) - -func (d Direction) String() string { - if d.Forward() { - return "forward" - } - return "reverse" -} - -// Forward returns true if direction is forward -func (d Direction) Forward() bool { - return d == Forward -} - -// Forward returns true if direction is reverse -func (d Direction) Reverse() bool { - return d == Reverse +// Cursor represents an iterator over a series. +type Cursor interface { + Seek(seek []byte) (key, value []byte) + Next() (key, value []byte) + Ascending() bool } // MultiCursor returns a single cursor that combines the results of all cursors in order. @@ -42,16 +22,17 @@ func (d Direction) Reverse() bool { // If the same key is returned from multiple cursors then the first cursor // specified will take precendence. A key will only be returned once from the // returned cursor. -func MultiCursor(d Direction, cursors ...Cursor) Cursor { - return &multiCursor{cursors: cursors, direction: d} +func MultiCursor(cursors ...Cursor) Cursor { + return &multiCursor{ + cursors: cursors, + } } // multiCursor represents a cursor that combines multiple cursors into one. type multiCursor struct { - cursors []Cursor - heap cursorHeap - prev []byte - direction Direction + cursors []Cursor + heap cursorHeap + prev []byte } // Seek moves the cursor to a given key. @@ -81,7 +62,13 @@ func (mc *multiCursor) Seek(seek []byte) (key, value []byte) { return mc.pop() } -func (mc *multiCursor) Direction() Direction { return mc.direction } +// Ascending returns the direction of the first cursor. +func (mc *multiCursor) Ascending() bool { + if len(mc.cursors) == 0 { + return true + } + return mc.cursors[0].Ascending() +} // Next returns the next key/value from the cursor. func (mc *multiCursor) Next() (key, value []byte) { return mc.pop() } @@ -126,7 +113,7 @@ func (h cursorHeap) Len() int { return len(h) } func (h cursorHeap) Swap(i, j int) { h[i], h[j] = h[j], h[i] } func (h cursorHeap) Less(i, j int) bool { dir := -1 - if !h[i].cursor.Direction() { + if !h[i].cursor.Ascending() { dir = 1 } diff --git a/tsdb/cursor_test.go b/tsdb/cursor_test.go index a07f333a50..789391fc6c 100644 --- a/tsdb/cursor_test.go +++ b/tsdb/cursor_test.go @@ -14,13 +14,11 @@ import ( // Ensure the multi-cursor can correctly iterate across a single subcursor. func TestMultiCursor_Single(t *testing.T) { - mc := tsdb.MultiCursor(tsdb.Forward, - NewCursor(tsdb.Forward, []CursorItem{ - {Key: []byte{0x00}, Value: []byte{0x00}}, - {Key: []byte{0x01}, Value: []byte{0x10}}, - {Key: []byte{0x02}, Value: []byte{0x20}}, - }), - ) + mc := tsdb.MultiCursor(NewCursor([]CursorItem{ + {Key: []byte{0x00}, Value: []byte{0x00}}, + {Key: []byte{0x01}, Value: []byte{0x10}}, + {Key: []byte{0x02}, Value: []byte{0x20}}, + }, true)) if k, v := mc.Seek([]byte{0x00}); !bytes.Equal(k, []byte{0x00}) || !bytes.Equal(v, []byte{0x00}) { t.Fatalf("unexpected key/value: %x / %x", k, v) @@ -35,13 +33,11 @@ func TestMultiCursor_Single(t *testing.T) { // Ensure the multi-cursor can correctly iterate across a single subcursor in reverse order. func TestMultiCursor_Single_Reverse(t *testing.T) { - mc := tsdb.MultiCursor(tsdb.Reverse, - NewCursor(tsdb.Reverse, []CursorItem{ - {Key: []byte{0x00}, Value: []byte{0x00}}, - {Key: []byte{0x01}, Value: []byte{0x10}}, - {Key: []byte{0x02}, Value: []byte{0x20}}, - }), - ) + mc := tsdb.MultiCursor(NewCursor([]CursorItem{ + {Key: []byte{0x00}, Value: []byte{0x00}}, + {Key: []byte{0x01}, Value: []byte{0x10}}, + {Key: []byte{0x02}, Value: []byte{0x20}}, + }, false)) if k, v := mc.Seek([]byte{0x02}); !bytes.Equal(k, []byte{0x02}) || !bytes.Equal(v, []byte{0x20}) { t.Fatalf("unexpected key/value: %x / %x", k, v) @@ -56,16 +52,16 @@ func TestMultiCursor_Single_Reverse(t *testing.T) { // Ensure the multi-cursor can correctly iterate across multiple non-overlapping subcursors. func TestMultiCursor_Multiple_NonOverlapping(t *testing.T) { - mc := tsdb.MultiCursor(tsdb.Forward, - NewCursor(tsdb.Forward, []CursorItem{ + mc := tsdb.MultiCursor( + NewCursor([]CursorItem{ {Key: []byte{0x00}, Value: []byte{0x00}}, {Key: []byte{0x03}, Value: []byte{0x30}}, {Key: []byte{0x04}, Value: []byte{0x40}}, - }), - NewCursor(tsdb.Forward, []CursorItem{ + }, true), + NewCursor([]CursorItem{ {Key: []byte{0x01}, Value: []byte{0x10}}, {Key: []byte{0x02}, Value: []byte{0x20}}, - }), + }, true), ) if k, v := mc.Seek([]byte{0x00}); !bytes.Equal(k, []byte{0x00}) || !bytes.Equal(v, []byte{0x00}) { @@ -85,16 +81,16 @@ func TestMultiCursor_Multiple_NonOverlapping(t *testing.T) { // Ensure the multi-cursor can correctly iterate across multiple non-overlapping subcursors. func TestMultiCursor_Multiple_NonOverlapping_Reverse(t *testing.T) { - mc := tsdb.MultiCursor(tsdb.Reverse, - NewCursor(tsdb.Reverse, []CursorItem{ + mc := tsdb.MultiCursor( + NewCursor([]CursorItem{ {Key: []byte{0x00}, Value: []byte{0x00}}, {Key: []byte{0x03}, Value: []byte{0x30}}, {Key: []byte{0x04}, Value: []byte{0x40}}, - }), - NewCursor(tsdb.Reverse, []CursorItem{ + }, false), + NewCursor([]CursorItem{ {Key: []byte{0x01}, Value: []byte{0x10}}, {Key: []byte{0x02}, Value: []byte{0x20}}, - }), + }, false), ) if k, v := mc.Seek([]byte{0x04}); !bytes.Equal(k, []byte{0x04}) || !bytes.Equal(v, []byte{0x40}) { @@ -114,17 +110,17 @@ func TestMultiCursor_Multiple_NonOverlapping_Reverse(t *testing.T) { // Ensure the multi-cursor can correctly iterate across multiple overlapping subcursors. func TestMultiCursor_Multiple_Overlapping(t *testing.T) { - mc := tsdb.MultiCursor(tsdb.Forward, - NewCursor(tsdb.Forward, []CursorItem{ + mc := tsdb.MultiCursor( + NewCursor([]CursorItem{ {Key: []byte{0x00}, Value: []byte{0x00}}, {Key: []byte{0x03}, Value: []byte{0x03}}, {Key: []byte{0x04}, Value: []byte{0x04}}, - }), - NewCursor(tsdb.Forward, []CursorItem{ + }, true), + NewCursor([]CursorItem{ {Key: []byte{0x00}, Value: []byte{0xF0}}, {Key: []byte{0x02}, Value: []byte{0xF2}}, {Key: []byte{0x04}, Value: []byte{0xF4}}, - }), + }, true), ) if k, v := mc.Seek([]byte{0x00}); !bytes.Equal(k, []byte{0x00}) || !bytes.Equal(v, []byte{0x00}) { @@ -142,17 +138,17 @@ func TestMultiCursor_Multiple_Overlapping(t *testing.T) { // Ensure the multi-cursor can correctly iterate across multiple overlapping subcursors. func TestMultiCursor_Multiple_Overlapping_Reverse(t *testing.T) { - mc := tsdb.MultiCursor(tsdb.Reverse, - NewCursor(tsdb.Reverse, []CursorItem{ + mc := tsdb.MultiCursor( + NewCursor([]CursorItem{ {Key: []byte{0x00}, Value: []byte{0x00}}, {Key: []byte{0x03}, Value: []byte{0x03}}, {Key: []byte{0x04}, Value: []byte{0x04}}, - }), - NewCursor(tsdb.Reverse, []CursorItem{ + }, false), + NewCursor([]CursorItem{ {Key: []byte{0x00}, Value: []byte{0xF0}}, {Key: []byte{0x02}, Value: []byte{0xF2}}, {Key: []byte{0x04}, Value: []byte{0xF4}}, - }), + }, false), ) if k, v := mc.Seek([]byte{0x04}); !bytes.Equal(k, []byte{0x04}) || !bytes.Equal(v, []byte{0x04}) { @@ -196,7 +192,7 @@ func TestMultiCursor_Quick(t *testing.T) { sort.Sort(byteSlices(exp)) // Create multi-cursor and iterate over all items. - mc := tsdb.MultiCursor(tsdb.Forward, tsdbCursorSlice(cursors)...) + mc := tsdb.MultiCursor(tsdbCursorSlice(cursors)...) for k, v := mc.Seek(u64tob(seek)); k != nil; k, v = mc.Next() { got = append(got, append(k, v...)) } @@ -212,27 +208,31 @@ func TestMultiCursor_Quick(t *testing.T) { // Cursor represents an in-memory test cursor. type Cursor struct { - direction tsdb.Direction items []CursorItem index int + ascending bool } // NewCursor returns a new instance of Cursor. -func NewCursor(direction tsdb.Direction, items []CursorItem) *Cursor { +func NewCursor(items []CursorItem, ascending bool) *Cursor { index := 0 sort.Sort(CursorItems(items)) - if direction.Reverse() { + if !ascending { index = len(items) } - return &Cursor{direction: direction, items: items, index: index} + return &Cursor{ + items: items, + index: index, + ascending: ascending, + } } -func (c *Cursor) Direction() tsdb.Direction { return c.direction } +func (c *Cursor) Ascending() bool { return c.ascending } // Seek seeks to an item by key. func (c *Cursor) Seek(seek []byte) (key, value []byte) { - if c.direction.Forward() { + if c.ascending { return c.seekForward(seek) } return c.seekReverse(seek) @@ -260,17 +260,17 @@ func (c *Cursor) seekReverse(seek []byte) (key, value []byte) { // Next returns the next key/value pair. func (c *Cursor) Next() (key, value []byte) { - if c.direction.Reverse() && c.index < 0 { + if !c.ascending && c.index < 0 { return nil, nil } - if c.direction.Forward() && c.index >= len(c.items) { + if c.ascending && c.index >= len(c.items) { return nil, nil } k, v := c.items[c.index].Key, c.items[c.index].Value - if c.direction.Forward() { + if c.ascending { c.index++ } else { c.index-- @@ -281,7 +281,7 @@ func (c *Cursor) Next() (key, value []byte) { // Generate returns a randomly generated cursor. Implements quick.Generator. func (c Cursor) Generate(rand *rand.Rand, size int) reflect.Value { c.index = 0 - c.direction = tsdb.Forward + c.ascending = true c.items = make([]CursorItem, rand.Intn(size)) for i := range c.items { diff --git a/tsdb/engine.go b/tsdb/engine.go index 9be48a1cc9..fd77da7f54 100644 --- a/tsdb/engine.go +++ b/tsdb/engine.go @@ -121,19 +121,12 @@ func NewEngineOptions() EngineOptions { type Tx interface { io.WriterTo - Cursor(series string, direction Direction) Cursor + Cursor(series string, ascending bool) Cursor Size() int64 Commit() error Rollback() error } -// Cursor represents an iterator over a series. -type Cursor interface { - Seek(seek []byte) (key, value []byte) - Next() (key, value []byte) - Direction() Direction -} - // DedupeEntries returns slices with unique keys (the first 8 bytes). func DedupeEntries(a [][]byte) [][]byte { // Convert to a map where the last slice is used. diff --git a/tsdb/engine/b1/b1.go b/tsdb/engine/b1/b1.go index 5efb732e04..3f8aaec313 100644 --- a/tsdb/engine/b1/b1.go +++ b/tsdb/engine/b1/b1.go @@ -551,7 +551,7 @@ type Tx struct { } // Cursor returns an iterator for a key. -func (tx *Tx) Cursor(key string, direction tsdb.Direction) tsdb.Cursor { +func (tx *Tx) Cursor(key string, ascending bool) tsdb.Cursor { // Retrieve key bucket. b := tx.Bucket([]byte(key)) @@ -569,13 +569,13 @@ func (tx *Tx) Cursor(key string, direction tsdb.Direction) tsdb.Cursor { copy(cache, tx.engine.cache[partitionID][key]) // Build a cursor that merges the bucket and cache together. - cur := &Cursor{cache: cache, direction: direction} + cur := &Cursor{cache: cache, ascending: ascending} if b != nil { cur.cursor = b.Cursor() } // If it's a reverse cursor, set the current location to the end. - if direction.Reverse() { + if !ascending { cur.index = len(cache) - 1 if cur.cursor != nil { cur.cursor.Last() @@ -600,10 +600,10 @@ type Cursor struct { prev []byte // The direction the cursor pointer moves after each call to Next() - direction tsdb.Direction + ascending bool } -func (c *Cursor) Direction() tsdb.Direction { return c.direction } +func (c *Cursor) Ascending() bool { return c.ascending } // Seek moves the cursor to a position and returns the closest key/value pair. func (c *Cursor) Seek(seek []byte) (key, value []byte) { @@ -619,7 +619,7 @@ func (c *Cursor) Seek(seek []byte) (key, value []byte) { // Search will return an index after the length of cache if the seek value is greater // than all the values. Clamp it to the end of the cache. - if c.direction.Reverse() && c.index >= len(c.cache) { + if !c.ascending && c.index >= len(c.cache) { c.index = len(c.cache) - 1 } @@ -636,7 +636,7 @@ func (c *Cursor) Next() (key, value []byte) { func (c *Cursor) read() (key, value []byte) { // Continue skipping ahead through duplicate keys in the cache list. for { - if c.direction.Forward() { + if c.ascending { key, value = c.readForward() } else { key, value = c.readReverse() diff --git a/tsdb/engine/b1/b1_test.go b/tsdb/engine/b1/b1_test.go index 21cd7b590d..4589d1c30b 100644 --- a/tsdb/engine/b1/b1_test.go +++ b/tsdb/engine/b1/b1_test.go @@ -66,7 +66,7 @@ func TestEngine_WritePoints(t *testing.T) { tx := e.MustBegin(false) defer tx.Rollback() - c := tx.Cursor("temperature", tsdb.Forward) + c := tx.Cursor("temperature", true) if k, v := c.Seek([]byte{0}); !bytes.Equal(k, u64tob(uint64(time.Unix(1434059627, 0).UnixNano()))) { t.Fatalf("unexpected key: %#v", k) } else if m, err := mf.Codec.DecodeFieldsWithNames(v); err != nil { @@ -131,7 +131,7 @@ func TestEngine_WritePoints_Reverse(t *testing.T) { tx := e.MustBegin(false) defer tx.Rollback() - c := tx.Cursor("temperature", tsdb.Reverse) + c := tx.Cursor("temperature", false) if k, _ := c.Seek(u64tob(math.MaxInt64)); !bytes.Equal(k, u64tob(uint64(time.Unix(1, 0).UnixNano()))) { t.Fatalf("unexpected key: %v", btou64(k)) } else if k, v := c.Next(); !bytes.Equal(k, u64tob(uint64(time.Unix(0, 0).UnixNano()))) { diff --git a/tsdb/engine/bz1/bz1.go b/tsdb/engine/bz1/bz1.go index a1fd35b0c1..7edc9a8291 100644 --- a/tsdb/engine/bz1/bz1.go +++ b/tsdb/engine/bz1/bz1.go @@ -74,7 +74,7 @@ type WAL interface { WritePoints(points []models.Point, measurementFieldsToSave map[string]*tsdb.MeasurementFields, seriesToCreate []*tsdb.SeriesCreate) error LoadMetadataIndex(index *tsdb.DatabaseIndex, measurementFields map[string]*tsdb.MeasurementFields) error DeleteSeries(keys []string) error - Cursor(key string, direction tsdb.Direction) tsdb.Cursor + Cursor(key string, ascending bool) tsdb.Cursor Open() error Close() error Flush() error @@ -623,8 +623,8 @@ type Tx struct { } // Cursor returns an iterator for a key. -func (tx *Tx) Cursor(key string, direction tsdb.Direction) tsdb.Cursor { - walCursor := tx.wal.Cursor(key, direction) +func (tx *Tx) Cursor(key string, ascending bool) tsdb.Cursor { + walCursor := tx.wal.Cursor(key, ascending) // Retrieve points bucket. Ignore if there is no bucket. b := tx.Bucket([]byte("points")).Bucket([]byte(key)) @@ -634,14 +634,14 @@ func (tx *Tx) Cursor(key string, direction tsdb.Direction) tsdb.Cursor { c := &Cursor{ cursor: b.Cursor(), - direction: direction, + ascending: ascending, } - if direction.Reverse() { + if !ascending { c.last() } - return tsdb.MultiCursor(direction, walCursor, c) + return tsdb.MultiCursor(walCursor, c) } // Cursor provides ordered iteration across a series. @@ -649,7 +649,7 @@ type Cursor struct { cursor *bolt.Cursor buf []byte // uncompressed buffer off int // buffer offset - direction tsdb.Direction + ascending bool fieldIndices []int index int } @@ -659,7 +659,7 @@ func (c *Cursor) last() { c.setBuf(v) } -func (c *Cursor) Direction() tsdb.Direction { return c.direction } +func (c *Cursor) Ascending() bool { return c.ascending } // Seek moves the cursor to a position and returns the closest key/value pair. func (c *Cursor) Seek(seek []byte) (key, value []byte) { @@ -695,13 +695,13 @@ func (c *Cursor) seekBuf(seek []byte) (key, value []byte) { return } - if c.direction.Forward() && bytes.Compare(buf[0:8], seek) != -1 { + if c.ascending && bytes.Compare(buf[0:8], seek) != -1 { return - } else if c.direction.Reverse() && bytes.Compare(buf[0:8], seek) != 1 { + } else if !c.ascending && bytes.Compare(buf[0:8], seek) != 1 { return } - if c.direction.Forward() { + if c.ascending { // Otherwise skip ahead to the next entry. c.off += entryHeaderSize + entryDataSize(buf) } else { @@ -721,7 +721,7 @@ func (c *Cursor) Next() (key, value []byte) { return nil, nil } - if c.direction.Forward() { + if c.ascending { // Move forward to next entry. c.off += entryHeaderSize + entryDataSize(c.buf[c.off:]) } else { @@ -762,7 +762,7 @@ func (c *Cursor) setBuf(block []byte) { log.Printf("block decode error: %s", err) } - if c.direction.Forward() { + if c.ascending { c.buf, c.off = buf, 0 } else { c.buf, c.off = buf, 0 diff --git a/tsdb/engine/bz1/bz1_test.go b/tsdb/engine/bz1/bz1_test.go index 1a72068131..957ec930af 100644 --- a/tsdb/engine/bz1/bz1_test.go +++ b/tsdb/engine/bz1/bz1_test.go @@ -177,7 +177,7 @@ func TestEngine_WriteIndex_Append(t *testing.T) { defer tx.Rollback() // Iterate over "cpu" series. - c := tx.Cursor("cpu", tsdb.Forward) + c := tx.Cursor("cpu", true) if k, v := c.Seek(u64tob(0)); !reflect.DeepEqual(k, []byte{0, 0, 0, 0, 0, 0, 0, 1}) || !reflect.DeepEqual(v, []byte{0x10}) { t.Fatalf("unexpected key/value: %x / %x", k, v) } else if k, v = c.Next(); !reflect.DeepEqual(k, []byte{0, 0, 0, 0, 0, 0, 0, 2}) || !reflect.DeepEqual(v, []byte{0x20}) { @@ -187,7 +187,7 @@ func TestEngine_WriteIndex_Append(t *testing.T) { } // Iterate over "mem" series. - c = tx.Cursor("mem", tsdb.Forward) + c = tx.Cursor("mem", true) if k, v := c.Seek(u64tob(0)); !reflect.DeepEqual(k, []byte{0, 0, 0, 0, 0, 0, 0, 0}) || !reflect.DeepEqual(v, []byte{0x30}) { t.Fatalf("unexpected key/value: %x / %x", k, v) } else if k, _ = c.Next(); k != nil { @@ -237,7 +237,7 @@ func TestEngine_WriteIndex_Insert(t *testing.T) { defer tx.Rollback() // Iterate over "cpu" series. - c := tx.Cursor("cpu", tsdb.Forward) + c := tx.Cursor("cpu", true) if k, v := c.Seek(u64tob(0)); btou64(k) != 9 || !bytes.Equal(v, []byte{0x09}) { t.Fatalf("unexpected key/value: %x / %x", k, v) } else if k, v = c.Next(); btou64(k) != 10 || !bytes.Equal(v, []byte{0xFF}) { @@ -295,7 +295,7 @@ func TestEngine_Cursor_Reverse(t *testing.T) { defer tx.Rollback() // Iterate over "cpu" series. - c := tx.Cursor("cpu", tsdb.Reverse) + c := tx.Cursor("cpu", false) if k, v := c.Seek(u64tob(math.MaxUint64)); btou64(k) != 31 || !bytes.Equal(v, []byte{0xFF}) { t.Fatalf("unexpected key/value: %x / %x", k, v) } else if k, v = c.Next(); btou64(k) != 30 || !bytes.Equal(v, []byte{0x30}) { @@ -336,7 +336,7 @@ func TestEngine_WriteIndex_SeekAgainstInBlockValue(t *testing.T) { defer tx.Rollback() // Ensure that we can seek to a block in the middle - c := tx.Cursor("cpu", tsdb.Forward) + c := tx.Cursor("cpu", true) if k, _ := c.Seek(u64tob(15)); btou64(k) != 20 { t.Fatalf("expected to seek to time 20, but got %d", btou64(k)) } @@ -394,7 +394,7 @@ func TestEngine_WriteIndex_Quick(t *testing.T) { // Iterate over results to ensure they are correct. for _, key := range keys { - c := tx.Cursor(key, tsdb.Forward) + c := tx.Cursor(key, true) // Read list of key/values. var got [][]byte @@ -441,7 +441,7 @@ func TestEngine_WriteIndex_Quick_Append(t *testing.T) { // Iterate over results to ensure they are correct. for _, key := range keys { - c := tx.Cursor(key, tsdb.Forward) + c := tx.Cursor(key, true) // Read list of key/values. var got [][]byte @@ -583,18 +583,18 @@ func (w *EnginePointsWriter) Open() error { return nil } func (w *EnginePointsWriter) Close() error { return nil } -func (w *EnginePointsWriter) Cursor(key string, direction tsdb.Direction) tsdb.Cursor { - return &Cursor{direction: direction} +func (w *EnginePointsWriter) Cursor(key string, ascending bool) tsdb.Cursor { + return &Cursor{ascending: ascending} } func (w *EnginePointsWriter) Flush() error { return nil } // Cursor represents a mock that implements tsdb.Curosr. type Cursor struct { - direction tsdb.Direction + ascending bool } -func (c *Cursor) Direction() tsdb.Direction { return c.direction } +func (c *Cursor) Ascending() bool { return c.ascending } func (c *Cursor) Seek(key []byte) ([]byte, []byte) { return nil, nil } diff --git a/tsdb/engine/wal/wal.go b/tsdb/engine/wal/wal.go index 30571a1800..bd939a7bb4 100644 --- a/tsdb/engine/wal/wal.go +++ b/tsdb/engine/wal/wal.go @@ -255,11 +255,10 @@ func (l *Log) DiskSize() (int64, error) { } // Cursor will return a cursor object to Seek and iterate with Next for the WAL cache for the given -func (l *Log) Cursor(key string, direction tsdb.Direction) tsdb.Cursor { +func (l *Log) Cursor(key string, ascending bool) tsdb.Cursor { l.mu.RLock() defer l.mu.RUnlock() - - return l.partition.cursor(key, direction) + return l.partition.cursor(key, ascending) } func (l *Log) WritePoints(points []models.Point, fields map[string]*tsdb.MeasurementFields, series []*tsdb.SeriesCreate) error { @@ -1215,7 +1214,7 @@ func (p *Partition) addToCache(key, data []byte, timestamp int64) { } // cursor will combine the in memory cache and flush cache (if a flush is currently happening) to give a single ordered cursor for the key -func (p *Partition) cursor(key string, direction tsdb.Direction) *cursor { +func (p *Partition) cursor(key string, ascending bool) *cursor { p.mu.Lock() defer p.mu.Unlock() @@ -1233,7 +1232,7 @@ func (p *Partition) cursor(key string, direction tsdb.Direction) *cursor { c = append(c, entry.points...) dedupe := tsdb.DedupeEntries(c) - return newCursor(dedupe, direction) + return newCursor(dedupe, ascending) } } @@ -1245,7 +1244,7 @@ func (p *Partition) cursor(key string, direction tsdb.Direction) *cursor { // build a copy so modifications to the partition don't change the result set a := make([][]byte, len(entry.points)) copy(a, entry.points) - return newCursor(a, direction) + return newCursor(a, ascending) } // idFromFileName parses the segment file ID from its name @@ -1408,20 +1407,24 @@ type entry struct { type cursor struct { cache [][]byte position int - direction tsdb.Direction + ascending bool } -func newCursor(cache [][]byte, direction tsdb.Direction) *cursor { +func newCursor(cache [][]byte, ascending bool) *cursor { // position is set such that a call to Next will successfully advance // to the next postion and return the value. - c := &cursor{cache: cache, direction: direction, position: -1} - if direction.Reverse() { + c := &cursor{ + cache: cache, + ascending: ascending, + position: -1, + } + if !ascending { c.position = len(c.cache) } return c } -func (c *cursor) Direction() tsdb.Direction { return c.direction } +func (c *cursor) Ascending() bool { return c.ascending } // Seek will point the cursor to the given time (or key) func (c *cursor) Seek(seek []byte) (key, value []byte) { @@ -1431,7 +1434,7 @@ func (c *cursor) Seek(seek []byte) (key, value []byte) { }) // If seek is not in the cache, return the last value in the cache - if c.direction.Reverse() && c.position >= len(c.cache) { + if !c.ascending && c.position >= len(c.cache) { c.position = len(c.cache) } @@ -1452,7 +1455,7 @@ func (c *cursor) Seek(seek []byte) (key, value []byte) { // Next moves the cursor to the next key/value. will return nil if at the end func (c *cursor) Next() (key, value []byte) { var v []byte - if c.direction.Forward() { + if c.ascending { v = c.nextForward() } else { v = c.nextReverse() diff --git a/tsdb/engine/wal/wal_test.go b/tsdb/engine/wal/wal_test.go index 82f97f86c1..03fb4c9e4f 100644 --- a/tsdb/engine/wal/wal_test.go +++ b/tsdb/engine/wal/wal_test.go @@ -41,7 +41,7 @@ func TestWAL_WritePoints(t *testing.T) { t.Fatalf("failed to write points: %s", err.Error()) } - c := log.Cursor("cpu,host=A", tsdb.Forward) + c := log.Cursor("cpu,host=A", true) k, v := c.Seek(inttob(1)) // ensure the series are there and points are in order @@ -59,7 +59,7 @@ func TestWAL_WritePoints(t *testing.T) { t.Fatalf("expected nil on last seek: %v %v", k, v) } - c = log.Cursor("cpu,host=B", tsdb.Forward) + c = log.Cursor("cpu,host=B", true) k, v = c.Next() if bytes.Compare(v, p3.Data()) != 0 { t.Fatalf("expected to seek to first point but got key and value: %v %v", k, v) @@ -98,7 +98,7 @@ func TestWAL_WritePoints(t *testing.T) { t.Fatalf("failed to write points: %s", err.Error()) } - c = log.Cursor("cpu,host=A", tsdb.Forward) + c = log.Cursor("cpu,host=A", true) k, v = c.Next() if bytes.Compare(v, p6.Data()) != 0 { t.Fatal("order wrong, expected p6") @@ -108,7 +108,7 @@ func TestWAL_WritePoints(t *testing.T) { t.Fatal("order wrong, expected p6") } - c = log.Cursor("cpu,host=C", tsdb.Forward) + c = log.Cursor("cpu,host=C", true) _, v = c.Next() if bytes.Compare(v, p5.Data()) != 0 { t.Fatal("order wrong, expected p6") @@ -156,7 +156,7 @@ func TestWAL_CorruptDataLengthSize(t *testing.T) { t.Fatalf("failed to write points: %s", err.Error()) } - c := log.Cursor("cpu,host=A", tsdb.Forward) + c := log.Cursor("cpu,host=A", true) _, v := c.Next() if bytes.Compare(v, p1.Data()) != 0 { t.Fatal("p1 value wrong") @@ -195,7 +195,7 @@ func TestWAL_CorruptDataLengthSize(t *testing.T) { t.Fatalf("failed to write point: %s", err.Error()) } - c = log.Cursor("cpu,host=A", tsdb.Forward) + c = log.Cursor("cpu,host=A", true) _, v = c.Next() if bytes.Compare(v, p3.Data()) != 0 { t.Fatal("p3 value wrong") @@ -235,7 +235,7 @@ func TestWAL_CorruptDataBlock(t *testing.T) { t.Fatalf("failed to write points: %s", err.Error()) } - c := log.Cursor("cpu,host=A", tsdb.Forward) + c := log.Cursor("cpu,host=A", true) _, v := c.Next() if bytes.Compare(v, p1.Data()) != 0 { t.Fatal("p1 value wrong") @@ -280,7 +280,7 @@ func TestWAL_CorruptDataBlock(t *testing.T) { t.Fatalf("failed to write point: %s", err.Error()) } - c = log.Cursor("cpu,host=A", tsdb.Forward) + c = log.Cursor("cpu,host=A", true) _, v = c.Next() if bytes.Compare(v, p3.Data()) != 0 { t.Fatal("p3 value wrong", p3.Data(), v) @@ -341,7 +341,7 @@ func TestWAL_CompactAfterTimeWithoutWrite(t *testing.T) { } // ensure we have some data - c := log.Cursor("cpu,host=A,region=uswest10", tsdb.Forward) + c := log.Cursor("cpu,host=A,region=uswest10", true) k, _ := c.Next() if btou64(k) != 1 { t.Fatalf("expected first data point but got one with key: %v", k) @@ -524,12 +524,12 @@ func TestWAL_DeleteSeries(t *testing.T) { } // ensure data is there - c := log.Cursor("cpu,host=A", tsdb.Forward) + c := log.Cursor("cpu,host=A", true) if k, _ := c.Next(); btou64(k) != 1 { t.Fatal("expected data point for cpu,host=A") } - c = log.Cursor("cpu,host=B", tsdb.Forward) + c = log.Cursor("cpu,host=B", true) if k, _ := c.Next(); btou64(k) != 2 { t.Fatal("expected data point for cpu,host=B") } @@ -546,13 +546,13 @@ func TestWAL_DeleteSeries(t *testing.T) { if len(points["cpu,host=B"]) != 0 { t.Fatal("expected cpu,host=B to have no points in index") } - c = log.Cursor("cpu,host=A", tsdb.Forward) + c = log.Cursor("cpu,host=A", true) if k, _ := c.Next(); k != nil { t.Fatal("expected data to be out of the cache cpu,host=A") } // ensure series is deleted - c = log.Cursor("cpu,host=B", tsdb.Forward) + c = log.Cursor("cpu,host=B", true) if k, _ := c.Next(); k != nil { t.Fatal("expected no data for cpu,host=B") } @@ -618,7 +618,7 @@ func TestWAL_QueryDuringCompaction(t *testing.T) { } verify := func() { - c := log.Cursor("cpu,host=A", tsdb.Forward) + c := log.Cursor("cpu,host=A", true) k, v := c.Seek(inttob(1)) // ensure the series are there and points are in order if bytes.Compare(v, p1.Data()) != 0 { @@ -664,7 +664,7 @@ func TestWAL_PointsSorted(t *testing.T) { t.Fatalf("failed to write points: %s", err.Error()) } - c := log.Cursor("cpu,host=A", tsdb.Forward) + c := log.Cursor("cpu,host=A", true) k, _ := c.Next() if btou64(k) != 1 { t.Fatal("points out of order") @@ -709,7 +709,7 @@ func TestWAL_Cursor_Reverse(t *testing.T) { t.Fatalf("failed to write points: %s", err.Error()) } - c := log.Cursor("cpu,host=A", tsdb.Reverse) + c := log.Cursor("cpu,host=A", false) k, _ := c.Next() if btou64(k) != 6 { t.Fatal("points out of order") diff --git a/tsdb/mapper.go b/tsdb/mapper.go index f207d07795..4b4316c409 100644 --- a/tsdb/mapper.go +++ b/tsdb/mapper.go @@ -229,12 +229,12 @@ func (m *RawMapper) openMeasurement(mm *Measurement) (SelectInfo, error) { } // Create all cursors for reading the data from this shard. - direction := Direction(m.stmt.TimeAscending()) + ascending := m.stmt.TimeAscending() for _, t := range info.TagSets { cursors := []*seriesCursor{} for i, key := range t.SeriesKeys { - c := m.tx.Cursor(key, direction) + c := m.tx.Cursor(key, ascending) if c == nil { continue } @@ -245,7 +245,7 @@ func (m *RawMapper) openMeasurement(mm *Measurement) (SelectInfo, error) { } tsc := NewTagSetCursor(mm.Name, t.Tags, cursors, m.shard.FieldCodec(mm.Name)) - if direction.Forward() { + if ascending { tsc.SeekTo(m.qmin) } else { tsc.SeekTo(m.qmax) @@ -460,7 +460,7 @@ func (m *AggregateMapper) openMeasurement(mm *Measurement) (SelectInfo, error) { cursors := []*seriesCursor{} for i, key := range t.SeriesKeys { - c := m.tx.Cursor(key, Forward) + c := m.tx.Cursor(key, true) if c == nil { continue } From b213ddad787c1cabc8c6d75bbfe316243264af06 Mon Sep 17 00:00:00 2001 From: Ben Johnson Date: Sun, 20 Sep 2015 16:27:22 -0600 Subject: [PATCH 4/8] refactor cursor --- influxql/ast.go | 31 +++ tsdb/cursor.go | 295 ++++++++++++++-------------- tsdb/cursor_test.go | 172 +++++++++-------- tsdb/engine.go | 3 +- tsdb/engine/b1/b1.go | 79 ++++++-- tsdb/engine/b1/b1_test.go | 31 ++- tsdb/engine/bz1/bz1.go | 38 ++-- tsdb/engine/bz1/bz1_test.go | 370 ++++++++---------------------------- tsdb/engine/wal/wal.go | 66 +++++-- tsdb/engine/wal/wal_test.go | 134 +++++-------- tsdb/mapper.go | 169 ++++++++-------- tsdb/meta.go | 106 +++++------ 12 files changed, 667 insertions(+), 827 deletions(-) diff --git a/influxql/ast.go b/influxql/ast.go index 3a343d6a5c..5d2f0536d3 100644 --- a/influxql/ast.go +++ b/influxql/ast.go @@ -718,6 +718,18 @@ type SelectStatement struct { FillValue interface{} } +// SourceNames returns a list of source names. +func (s *SelectStatement) SourceNames() []string { + a := make([]string, 0, len(s.Sources)) + for _, src := range s.Sources { + switch src := src.(type) { + case *Measurement: + a = append(a, src.Name) + } + } + return a +} + // HasDerivative returns true if one of the function calls in the statement is a // derivative aggregate func (s *SelectStatement) HasDerivative() bool { @@ -1522,6 +1534,25 @@ func (s *SelectStatement) NamesInDimension() []string { return a } +// LimitTagSets returns a tag set list with SLIMIT and SOFFSET applied. +func (s *SelectStatement) LimitTagSets(a []*TagSet) []*TagSet { + // Ignore if no limit or offset is specified. + if s.SLimit == 0 && s.SOffset == 0 { + return a + } + + // If offset is beyond the number of tag sets then return nil. + if s.SOffset > len(a) { + return nil + } + + // Clamp limit to the max number of tag sets. + if s.SOffset+s.SLimit > len(a) { + s.SLimit = len(a) - s.SOffset + } + return a[s.SOffset : s.SOffset+s.SLimit] +} + // walkNames will walk the Expr and return the database fields func walkNames(exp Expr) []string { switch expr := exp.(type) { diff --git a/tsdb/cursor.go b/tsdb/cursor.go index ac6a4c7421..9e00e37404 100644 --- a/tsdb/cursor.go +++ b/tsdb/cursor.go @@ -1,7 +1,6 @@ package tsdb import ( - "bytes" "container/heap" "encoding/binary" "sort" @@ -10,10 +9,13 @@ import ( "github.com/influxdb/influxdb/influxql" ) +// EOF represents a "not found" key returned by a Cursor. +const EOF = int64(-1) + // Cursor represents an iterator over a series. type Cursor interface { - Seek(seek []byte) (key, value []byte) - Next() (key, value []byte) + Seek(seek int64) (key int64, value interface{}) + Next() (key int64, value interface{}) Ascending() bool } @@ -32,17 +34,17 @@ func MultiCursor(cursors ...Cursor) Cursor { type multiCursor struct { cursors []Cursor heap cursorHeap - prev []byte + prev int64 // previously read key } // Seek moves the cursor to a given key. -func (mc *multiCursor) Seek(seek []byte) (key, value []byte) { +func (mc *multiCursor) Seek(seek int64) (key int64, value interface{}) { // Initialize heap. h := make(cursorHeap, 0, len(mc.cursors)) for i, c := range mc.cursors { // Move cursor to position. Skip if it's empty. k, v := c.Seek(seek) - if k == nil { + if k == EOF { continue } @@ -57,7 +59,7 @@ func (mc *multiCursor) Seek(seek []byte) (key, value []byte) { heap.Init(&h) mc.heap = h - mc.prev = nil + mc.prev = EOF return mc.pop() } @@ -71,18 +73,18 @@ func (mc *multiCursor) Ascending() bool { } // Next returns the next key/value from the cursor. -func (mc *multiCursor) Next() (key, value []byte) { return mc.pop() } +func (mc *multiCursor) Next() (key int64, value interface{}) { return mc.pop() } // pop returns the next item from the heap. // Reads the next key/value from item's cursor and puts it back on the heap. -func (mc *multiCursor) pop() (key, value []byte) { +func (mc *multiCursor) pop() (key int64, value interface{}) { // Read items until we have a key that doesn't match the previously read one. // This is to perform deduplication when there's multiple items with the same key. // The highest priority cursor will be read first and then remaining keys will be dropped. for { - // Return nil if there are no more items left. + // Return EOF marker if there are no more items left. if len(mc.heap) == 0 { - return nil, nil + return EOF, nil } // Read the next item from the heap. @@ -92,12 +94,12 @@ func (mc *multiCursor) pop() (key, value []byte) { key, value = item.key, item.value // Read the next item from the cursor. Push back to heap if one exists. - if item.key, item.value = item.cursor.Next(); item.key != nil { + if item.key, item.value = item.cursor.Next(); item.key != EOF { heap.Push(&mc.heap, item) } // Skip if this key matches the previously returned one. - if bytes.Equal(mc.prev, key) { + if key == mc.prev { continue } @@ -112,17 +114,16 @@ type cursorHeap []*cursorHeapItem func (h cursorHeap) Len() int { return len(h) } func (h cursorHeap) Swap(i, j int) { h[i], h[j] = h[j], h[i] } func (h cursorHeap) Less(i, j int) bool { - dir := -1 - if !h[i].cursor.Ascending() { - dir = 1 - } - - if cmp := bytes.Compare(h[i].key, h[j].key); cmp == dir { - return true - } else if cmp == 0 { + // Use priority if the keys are the same. + if h[i].key == h[j].key { return h[i].priority > h[j].priority } - return false + + // Otherwise compare based on cursor direction. + if h[i].cursor.Ascending() { + return h[i].key < h[j].key + } + return h[i].key > h[j].key } func (h *cursorHeap) Push(x interface{}) { @@ -139,62 +140,37 @@ func (h *cursorHeap) Pop() interface{} { // cursorHeapItem is something we manage in a priority queue. type cursorHeapItem struct { - key []byte - value []byte + key int64 + value interface{} cursor Cursor priority int } -// TagSetCursor is virtual cursor that iterates over mutiple series cursors, as though it were -// a single series. +// TagSetCursor is virtual cursor that iterates over multiple TagsCursors. type TagSetCursor struct { measurement string // Measurement name tags map[string]string // Tag key-value pairs - cursors []*seriesCursor // Underlying series cursors. - decoder *FieldCodec // decoder for the raw data bytes + cursors []*TagsCursor // Underlying tags cursors. currentTags map[string]string // the current tags for the underlying series cursor in play - // pointHeap is a min-heap, ordered by timestamp, that contains the next - // point from each seriesCursor. Queries sometimes pull points from - // thousands of series. This makes it reasonably efficient to find the - // point with the next lowest timestamp among the thousands of series that - // the query is pulling points from. - // Performance profiling shows that this lookahead needs to be part - // of the TagSetCursor type and not part of the the cursors type. - pointHeap *pointHeap + SelectFields []string + WhereFields []string - // Memomize the cursor's tagset-based key. Profiling shows that calculating this - // is significant CPU cost, and it only needs to be done once. + // Min-heap of cursors ordered by timestamp. + heap *pointHeap + + // Memoize the cursor's tagset-based key. memokey string } -// TagSetCursors represents a sortable slice of TagSetCursors. -type TagSetCursors []*TagSetCursor - -func (a TagSetCursors) Len() int { return len(a) } -func (a TagSetCursors) Less(i, j int) bool { return a[i].key() < a[j].key() } -func (a TagSetCursors) Swap(i, j int) { a[i], a[j] = a[j], a[i] } - -func (a TagSetCursors) Keys() []string { - keys := []string{} - for i := range a { - keys = append(keys, a[i].key()) - } - sort.Strings(keys) - return keys -} - // NewTagSetCursor returns a instance of TagSetCursor. -func NewTagSetCursor(m string, t map[string]string, c []*seriesCursor, d *FieldCodec) *TagSetCursor { - tsc := &TagSetCursor{ +func NewTagSetCursor(m string, t map[string]string, c []*TagsCursor) *TagSetCursor { + return &TagSetCursor{ measurement: m, tags: t, cursors: c, - decoder: d, - pointHeap: newPointHeap(), + heap: newPointHeap(), } - - return tsc } func (tsc *TagSetCursor) key() string { @@ -208,20 +184,20 @@ func (tsc *TagSetCursor) key() string { return tsc.memokey } -func (tsc *TagSetCursor) SeekTo(seek int64) { - tsc.pointHeap = newPointHeap() +func (tsc *TagSetCursor) Init(seek int64) { + tsc.heap = newPointHeap() // Prime the buffers. for i := 0; i < len(tsc.cursors); i++ { - k, v := tsc.cursors[i].SeekTo(seek) - if k == -1 { + k, v := tsc.cursors[i].Seek(seek) + if k == EOF { k, v = tsc.cursors[i].Next() } - if k == -1 { + if k == EOF { continue } - heap.Push(tsc.pointHeap, &pointHeapItem{ + heap.Push(tsc.heap, &pointHeapItem{ timestamp: k, value: v, cursor: tsc.cursors[i], @@ -231,38 +207,36 @@ func (tsc *TagSetCursor) SeekTo(seek int64) { // Next returns the next matching series-key, timestamp byte slice and meta tags for the tagset. Filtering // is enforced on the values. If there is no matching value, then a nil result is returned. -func (tsc *TagSetCursor) Next(tmin, tmax int64, selectFields, whereFields []string) (int64, interface{}) { +func (tsc *TagSetCursor) Next(tmin, tmax int64) (int64, interface{}) { for { // If we're out of points, we're done. - if tsc.pointHeap.Len() == 0 { + if tsc.heap.Len() == 0 { return -1, nil } // Grab the next point with the lowest timestamp. - p := heap.Pop(tsc.pointHeap).(*pointHeapItem) + p := heap.Pop(tsc.heap).(*pointHeapItem) // We're done if the point is outside the query's time range [tmin:tmax). if p.timestamp != tmin && (p.timestamp < tmin || p.timestamp >= tmax) { return -1, nil } - // Decode the raw point. - value := tsc.decodeRawPoint(p, selectFields, whereFields) - timestamp := p.timestamp + // Save timestamp & value. + timestamp, value := p.timestamp, p.value // Keep track of the current tags for the series cursor so we can // respond with them if asked tsc.currentTags = p.cursor.tags - // Advance the cursor - nextKey, nextVal := p.cursor.Next() - if nextKey != -1 { + // Advance the cursor. + if nextKey, nextVal := p.cursor.Next(); nextKey != -1 { *p = pointHeapItem{ timestamp: nextKey, value: nextVal, cursor: p.cursor, } - heap.Push(tsc.pointHeap, p) + heap.Push(tsc.heap, p) } // Value didn't match, look for the next one. @@ -276,52 +250,51 @@ func (tsc *TagSetCursor) Next(tmin, tmax int64, selectFields, whereFields []stri // Tags returns the current tags of the current cursor // if there is no current currsor, it returns nil -func (tsc *TagSetCursor) Tags() map[string]string { - return tsc.currentTags -} +func (tsc *TagSetCursor) Tags() map[string]string { return tsc.currentTags } // decodeRawPoint decodes raw point data into field names & values and does WHERE filtering. -func (tsc *TagSetCursor) decodeRawPoint(p *pointHeapItem, selectFields, whereFields []string) interface{} { - if len(selectFields) > 1 { - if fieldsWithNames, err := tsc.decoder.DecodeFieldsWithNames(p.value); err == nil { - // if there's a where clause, make sure we don't need to filter this value - if p.cursor.filter != nil && !influxql.EvalBool(p.cursor.filter, fieldsWithNames) { - return nil - } +// func (tsc *TagSetCursor) decodeRawPoint(p *pointHeapItem) interface{} { +// if len(tsc.SelectFields) > 1 { +// if fieldsWithNames, err := tsc.decoder.DecodeFieldsWithNames(p.value); err == nil { +// // If there's a where clause, make sure we don't need to filter this value +// if p.cursor.filter != nil && !influxql.EvalBool(p.cursor.filter, fieldsWithNames) { +// return nil +// } - return fieldsWithNames - } - } +// return fieldsWithNames +// } +// } - // With only 1 field SELECTed, decoding all fields may be avoidable, which is faster. - value, err := tsc.decoder.DecodeByName(selectFields[0], p.value) - if err != nil { - return nil - } +// // With only 1 field SELECTed, decoding all fields may be avoidable, which is faster. +// value, err := tsc.decoder.DecodeByName(tsc.SelectFields[0], p.value) +// if err != nil { +// return nil +// } - // If there's a WHERE clase, see if we need to filter - if p.cursor.filter != nil { - // See if the WHERE is only on this field or on one or more other fields. - // If the latter, we'll have to decode everything - if len(whereFields) == 1 && whereFields[0] == selectFields[0] { - if !influxql.EvalBool(p.cursor.filter, map[string]interface{}{selectFields[0]: value}) { - value = nil - } - } else { // Decode everything - fieldsWithNames, err := tsc.decoder.DecodeFieldsWithNames(p.value) - if err != nil || !influxql.EvalBool(p.cursor.filter, fieldsWithNames) { - value = nil - } - } - } +// // Return value if there's no filter. +// if p.cursor.filter == nil { +// return value +// } - return value -} +// // See if the WHERE is only on this field or on one or more other fields. +// // If the latter, we'll have to decode everything +// if len(tsc.WhereFields) == 1 && tsc.WhereFields[0] == tsc.SelectFields[0] { +// if !influxql.EvalBool(p.cursor.filter, map[string]interface{}{tsc.SelectFields[0]: value}) { +// value = nil +// } +// } else { +// fieldsWithNames, err := tsc.decoder.DecodeFieldsWithNames(p.value) +// if err != nil || !influxql.EvalBool(p.cursor.filter, fieldsWithNames) { +// value = nil +// } +// } +// return value +// } type pointHeapItem struct { timestamp int64 - value []byte - cursor *seriesCursor // cursor whence pointHeapItem came + value interface{} + cursor *TagsCursor // cursor whence pointHeapItem came } type pointHeap []*pointHeapItem @@ -354,63 +327,73 @@ func (pq *pointHeap) Pop() interface{} { return item } -// seriesCursor is a cursor that walks a single series. It provides lookahead functionality. -type seriesCursor struct { - cursor Cursor // BoltDB cursor for a series - filter influxql.Expr - tags map[string]string - seekto int64 - seekResult struct { - k int64 - v []byte +// TagsCursor is a cursor with attached tags and filter. +type TagsCursor struct { + cursor Cursor + filter influxql.Expr + tags map[string]string + + seek int64 + buf struct { + key int64 + value interface{} } } -// newSeriesCursor returns a new instance of a series cursor. -func newSeriesCursor(cur Cursor, filter influxql.Expr, tags map[string]string) *seriesCursor { - return &seriesCursor{ - cursor: cur, +// NewTagsCursor returns a new instance of a series cursor. +func NewTagsCursor(c Cursor, filter influxql.Expr, tags map[string]string) *TagsCursor { + return &TagsCursor{ + cursor: c, filter: filter, tags: tags, - seekto: -1, + seek: EOF, } } -// Seek positions returning the timestamp and value at that key. -func (sc *seriesCursor) SeekTo(key int64) (timestamp int64, value []byte) { - if sc.seekto != -1 && sc.seekto < key && (sc.seekResult.k == -1 || sc.seekResult.k >= key) { - // we've seeked on this cursor. This seek is after that previous cached seek - // and the result it gave was after the key for this seek. - // - // In this case, any seek would just return what we got before, so there's - // no point in reseeking. - return sc.seekResult.k, sc.seekResult.v +// Seek positions returning the key and value at that key. +func (c *TagsCursor) Seek(seek int64) (key int64, value interface{}) { + // We've seeked on this cursor. This seek is after that previous cached seek + // and the result it gave was after the key for this seek. + // + // In this case, any seek would just return what we got before, so there's + // no point in reseeking. + if c.seek != -1 && c.seek < seek && (c.buf.key == EOF || c.buf.key >= seek) { + return c.buf.key, c.buf.value } - k, v := sc.cursor.Seek(u64tob(uint64(key))) - if k == nil { - timestamp = -1 - } else { - timestamp, value = int64(btou64(k)), v - } - sc.seekto = key - sc.seekResult.k = timestamp - sc.seekResult.v = v + + // Seek to key/value in underlying cursor. + key, value = c.cursor.Seek(seek) + + // Save the seek to the buffer. + c.seek = seek + c.buf.key, c.buf.value = key, value return } // Next returns the next timestamp and value from the cursor. -func (sc *seriesCursor) Next() (key int64, value []byte) { - // calling next on this cursor means that we need to invalidate the seek - sc.seekto = -1 - sc.seekResult.k = 0 - sc.seekResult.v = nil - k, v := sc.cursor.Next() - if k == nil { - key = -1 - } else { - key, value = int64(btou64(k)), v +func (c *TagsCursor) Next() (key int64, value interface{}) { + // Invalidate the seek. + c.seek = -1 + c.buf.key, c.buf.value = 0, nil + + // Return next key/value. + return c.cursor.Next() +} + +// TagSetCursors represents a sortable slice of TagSetCursors. +type TagSetCursors []*TagSetCursor + +func (a TagSetCursors) Len() int { return len(a) } +func (a TagSetCursors) Less(i, j int) bool { return a[i].key() < a[j].key() } +func (a TagSetCursors) Swap(i, j int) { a[i], a[j] = a[j], a[i] } + +func (a TagSetCursors) Keys() []string { + keys := []string{} + for i := range a { + keys = append(keys, a[i].key()) } - return + sort.Strings(keys) + return keys } // btou64 converts an 8-byte slice into an uint64. diff --git a/tsdb/cursor_test.go b/tsdb/cursor_test.go index 789391fc6c..55965162e3 100644 --- a/tsdb/cursor_test.go +++ b/tsdb/cursor_test.go @@ -15,18 +15,18 @@ import ( // Ensure the multi-cursor can correctly iterate across a single subcursor. func TestMultiCursor_Single(t *testing.T) { mc := tsdb.MultiCursor(NewCursor([]CursorItem{ - {Key: []byte{0x00}, Value: []byte{0x00}}, - {Key: []byte{0x01}, Value: []byte{0x10}}, - {Key: []byte{0x02}, Value: []byte{0x20}}, + {Key: 0, Value: 0}, + {Key: 1, Value: 10}, + {Key: 2, Value: 20}, }, true)) - if k, v := mc.Seek([]byte{0x00}); !bytes.Equal(k, []byte{0x00}) || !bytes.Equal(v, []byte{0x00}) { + if k, v := mc.Seek(0); k != 0 || v.(int) != 0 { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, v = mc.Next(); !bytes.Equal(k, []byte{0x01}) || !bytes.Equal(v, []byte{0x10}) { + } else if k, v = mc.Next(); k != 1 || v.(int) != 10 { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, v = mc.Next(); !bytes.Equal(k, []byte{0x02}) || !bytes.Equal(v, []byte{0x20}) { + } else if k, v = mc.Next(); k != 2 || v.(int) != 20 { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, v = mc.Next(); k != nil { + } else if k, v = mc.Next(); k != tsdb.EOF { t.Fatalf("expected eof, got: %x / %x", k, v) } } @@ -34,18 +34,18 @@ func TestMultiCursor_Single(t *testing.T) { // Ensure the multi-cursor can correctly iterate across a single subcursor in reverse order. func TestMultiCursor_Single_Reverse(t *testing.T) { mc := tsdb.MultiCursor(NewCursor([]CursorItem{ - {Key: []byte{0x00}, Value: []byte{0x00}}, - {Key: []byte{0x01}, Value: []byte{0x10}}, - {Key: []byte{0x02}, Value: []byte{0x20}}, + {Key: 0, Value: 0}, + {Key: 1, Value: 10}, + {Key: 2, Value: 20}, }, false)) - if k, v := mc.Seek([]byte{0x02}); !bytes.Equal(k, []byte{0x02}) || !bytes.Equal(v, []byte{0x20}) { + if k, v := mc.Seek(2); k != 2 || v.(int) != 20 { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, v = mc.Next(); !bytes.Equal(k, []byte{0x01}) || !bytes.Equal(v, []byte{0x10}) { + } else if k, v = mc.Next(); k != 1 || v.(int) != 10 { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, v = mc.Next(); !bytes.Equal(k, []byte{0x00}) || !bytes.Equal(v, []byte{0x00}) { + } else if k, v = mc.Next(); k != 0 || v.(int) != 0 { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, v = mc.Next(); k != nil { + } else if k, v = mc.Next(); k != tsdb.EOF { t.Fatalf("expected eof, got: %x / %x", k, v) } } @@ -54,27 +54,27 @@ func TestMultiCursor_Single_Reverse(t *testing.T) { func TestMultiCursor_Multiple_NonOverlapping(t *testing.T) { mc := tsdb.MultiCursor( NewCursor([]CursorItem{ - {Key: []byte{0x00}, Value: []byte{0x00}}, - {Key: []byte{0x03}, Value: []byte{0x30}}, - {Key: []byte{0x04}, Value: []byte{0x40}}, + {Key: 0, Value: 0}, + {Key: 3, Value: 30}, + {Key: 4, Value: 40}, }, true), NewCursor([]CursorItem{ - {Key: []byte{0x01}, Value: []byte{0x10}}, - {Key: []byte{0x02}, Value: []byte{0x20}}, + {Key: 1, Value: 10}, + {Key: 2, Value: 20}, }, true), ) - if k, v := mc.Seek([]byte{0x00}); !bytes.Equal(k, []byte{0x00}) || !bytes.Equal(v, []byte{0x00}) { + if k, v := mc.Seek(0); k != 0 || v.(int) != 0 { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, v = mc.Next(); !bytes.Equal(k, []byte{0x01}) || !bytes.Equal(v, []byte{0x10}) { + } else if k, v = mc.Next(); k != 1 || v.(int) != 10 { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, v = mc.Next(); !bytes.Equal(k, []byte{0x02}) || !bytes.Equal(v, []byte{0x20}) { + } else if k, v = mc.Next(); k != 2 || v.(int) != 20 { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, v = mc.Next(); !bytes.Equal(k, []byte{0x03}) || !bytes.Equal(v, []byte{0x30}) { + } else if k, v = mc.Next(); k != 3 || v.(int) != 30 { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, v = mc.Next(); !bytes.Equal(k, []byte{0x04}) || !bytes.Equal(v, []byte{0x40}) { + } else if k, v = mc.Next(); k != 4 || v.(int) != 40 { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, v = mc.Next(); k != nil { + } else if k, v = mc.Next(); k != tsdb.EOF { t.Fatalf("expected eof, got: %x / %x", k, v) } } @@ -83,27 +83,27 @@ func TestMultiCursor_Multiple_NonOverlapping(t *testing.T) { func TestMultiCursor_Multiple_NonOverlapping_Reverse(t *testing.T) { mc := tsdb.MultiCursor( NewCursor([]CursorItem{ - {Key: []byte{0x00}, Value: []byte{0x00}}, - {Key: []byte{0x03}, Value: []byte{0x30}}, - {Key: []byte{0x04}, Value: []byte{0x40}}, + {Key: 0, Value: 0}, + {Key: 3, Value: 30}, + {Key: 4, Value: 40}, }, false), NewCursor([]CursorItem{ - {Key: []byte{0x01}, Value: []byte{0x10}}, - {Key: []byte{0x02}, Value: []byte{0x20}}, + {Key: 1, Value: 10}, + {Key: 2, Value: 20}, }, false), ) - if k, v := mc.Seek([]byte{0x04}); !bytes.Equal(k, []byte{0x04}) || !bytes.Equal(v, []byte{0x40}) { + if k, v := mc.Seek(4); k != 4 || v.(int) != 40 { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, v = mc.Next(); !bytes.Equal(k, []byte{0x03}) || !bytes.Equal(v, []byte{0x30}) { + } else if k, v = mc.Next(); k != 3 || v.(int) != 30 { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, v = mc.Next(); !bytes.Equal(k, []byte{0x02}) || !bytes.Equal(v, []byte{0x20}) { + } else if k, v = mc.Next(); k != 2 || v.(int) != 20 { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, v = mc.Next(); !bytes.Equal(k, []byte{0x01}) || !bytes.Equal(v, []byte{0x10}) { + } else if k, v = mc.Next(); k != 1 || v.(int) != 10 { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, v = mc.Next(); !bytes.Equal(k, []byte{0x00}) || !bytes.Equal(v, []byte{0x00}) { + } else if k, v = mc.Next(); k != 0 || v.(int) != 00 { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, v = mc.Next(); k != nil { + } else if k, v = mc.Next(); k != tsdb.EOF { t.Fatalf("expected eof, got: %x / %x", k, v) } } @@ -112,26 +112,26 @@ func TestMultiCursor_Multiple_NonOverlapping_Reverse(t *testing.T) { func TestMultiCursor_Multiple_Overlapping(t *testing.T) { mc := tsdb.MultiCursor( NewCursor([]CursorItem{ - {Key: []byte{0x00}, Value: []byte{0x00}}, - {Key: []byte{0x03}, Value: []byte{0x03}}, - {Key: []byte{0x04}, Value: []byte{0x04}}, + {Key: 0, Value: 0}, + {Key: 3, Value: 3}, + {Key: 4, Value: 4}, }, true), NewCursor([]CursorItem{ - {Key: []byte{0x00}, Value: []byte{0xF0}}, - {Key: []byte{0x02}, Value: []byte{0xF2}}, - {Key: []byte{0x04}, Value: []byte{0xF4}}, + {Key: 0, Value: 0xF0}, + {Key: 2, Value: 0xF2}, + {Key: 4, Value: 0xF4}, }, true), ) - if k, v := mc.Seek([]byte{0x00}); !bytes.Equal(k, []byte{0x00}) || !bytes.Equal(v, []byte{0x00}) { + if k, v := mc.Seek(0); k != 0 || v.(int) != 0 { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, v = mc.Next(); !bytes.Equal(k, []byte{0x02}) || !bytes.Equal(v, []byte{0xF2}) { + } else if k, v = mc.Next(); k != 2 || v.(int) != 0xF2 { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, v = mc.Next(); !bytes.Equal(k, []byte{0x03}) || !bytes.Equal(v, []byte{0x03}) { + } else if k, v = mc.Next(); k != 3 || v.(int) != 3 { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, v = mc.Next(); !bytes.Equal(k, []byte{0x04}) || !bytes.Equal(v, []byte{0x04}) { + } else if k, v = mc.Next(); k != 4 || v.(int) != 4 { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, v = mc.Next(); k != nil { + } else if k, v = mc.Next(); k != tsdb.EOF { t.Fatalf("expected eof, got: %x / %x", k, v) } } @@ -140,61 +140,61 @@ func TestMultiCursor_Multiple_Overlapping(t *testing.T) { func TestMultiCursor_Multiple_Overlapping_Reverse(t *testing.T) { mc := tsdb.MultiCursor( NewCursor([]CursorItem{ - {Key: []byte{0x00}, Value: []byte{0x00}}, - {Key: []byte{0x03}, Value: []byte{0x03}}, - {Key: []byte{0x04}, Value: []byte{0x04}}, + {Key: 0, Value: 0}, + {Key: 3, Value: 3}, + {Key: 4, Value: 4}, }, false), NewCursor([]CursorItem{ - {Key: []byte{0x00}, Value: []byte{0xF0}}, - {Key: []byte{0x02}, Value: []byte{0xF2}}, - {Key: []byte{0x04}, Value: []byte{0xF4}}, + {Key: 0, Value: 0xF0}, + {Key: 2, Value: 0xF2}, + {Key: 4, Value: 0xF4}, }, false), ) - if k, v := mc.Seek([]byte{0x04}); !bytes.Equal(k, []byte{0x04}) || !bytes.Equal(v, []byte{0x04}) { + if k, v := mc.Seek(4); k != 4 || v.(int) != 4 { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, v = mc.Next(); !bytes.Equal(k, []byte{0x03}) || !bytes.Equal(v, []byte{0x03}) { + } else if k, v = mc.Next(); k != 3 || v.(int) != 3 { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, v = mc.Next(); !bytes.Equal(k, []byte{0x02}) || !bytes.Equal(v, []byte{0xF2}) { + } else if k, v = mc.Next(); k != 2 || v.(int) != 0xF2 { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, v = mc.Next(); !bytes.Equal(k, []byte{0x00}) || !bytes.Equal(v, []byte{0x00}) { + } else if k, v = mc.Next(); k != 0 || v.(int) != 0 { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, v = mc.Next(); k != nil { + } else if k, v = mc.Next(); k != tsdb.EOF { t.Fatalf("expected eof, got: %x / %x", k, v) } } // Ensure the multi-cursor can handle randomly generated data. func TestMultiCursor_Quick(t *testing.T) { - quick.Check(func(seek uint64, cursors []Cursor) bool { - var got, exp [][]byte - seek %= 100 + quick.Check(func(useek uint64, cursors []Cursor) bool { + var got, exp []CursorItem + seek := int64(useek) % 100 // Merge all cursor data to determine expected output. // First seen key overrides all other items with the same key. - m := make(map[string][]byte) + m := make(map[int64]CursorItem) for _, c := range cursors { for _, item := range c.items { - if bytes.Compare(item.Key, u64tob(seek)) == -1 { + if item.Key < seek { continue } - if _, ok := m[string(item.Key)]; ok { + if _, ok := m[item.Key]; ok { continue } - m[string(item.Key)] = item.Value + m[item.Key] = item } } // Convert map back to single item list. - for k, v := range m { - exp = append(exp, append([]byte(k), v...)) + for _, item := range m { + exp = append(exp, item) } - sort.Sort(byteSlices(exp)) + sort.Sort(CursorItems(exp)) // Create multi-cursor and iterate over all items. mc := tsdb.MultiCursor(tsdbCursorSlice(cursors)...) - for k, v := mc.Seek(u64tob(seek)); k != nil; k, v = mc.Next() { - got = append(got, append(k, v...)) + for k, v := mc.Seek(seek); k != tsdb.EOF; k, v = mc.Next() { + got = append(got, CursorItem{k, v.(int)}) } // Verify results. @@ -231,41 +231,41 @@ func NewCursor(items []CursorItem, ascending bool) *Cursor { func (c *Cursor) Ascending() bool { return c.ascending } // Seek seeks to an item by key. -func (c *Cursor) Seek(seek []byte) (key, value []byte) { +func (c *Cursor) Seek(seek int64) (key int64, value interface{}) { if c.ascending { return c.seekForward(seek) } return c.seekReverse(seek) } -func (c *Cursor) seekForward(seek []byte) (key, value []byte) { +func (c *Cursor) seekForward(seek int64) (key int64, value interface{}) { for c.index = 0; c.index < len(c.items); c.index++ { - if bytes.Compare(c.items[c.index].Key, seek) == -1 { // skip keys less than seek + if c.items[c.index].Key < seek { // skip keys less than seek continue } return c.items[c.index].Key, c.items[c.index].Value } - return nil, nil + return tsdb.EOF, nil } -func (c *Cursor) seekReverse(seek []byte) (key, value []byte) { +func (c *Cursor) seekReverse(seek int64) (key int64, value interface{}) { for c.index = len(c.items) - 1; c.index >= 0; c.index-- { - if bytes.Compare(c.items[c.index].Key, seek) == 1 { // skip keys greater than seek + if c.items[c.index].Key > seek { // skip keys greater than seek continue } return c.items[c.index].Key, c.items[c.index].Value } - return nil, nil + return tsdb.EOF, nil } // Next returns the next key/value pair. -func (c *Cursor) Next() (key, value []byte) { +func (c *Cursor) Next() (key int64, value interface{}) { if !c.ascending && c.index < 0 { - return nil, nil + return tsdb.EOF, nil } if c.ascending && c.index >= len(c.items) { - return nil, nil + return tsdb.EOF, nil } k, v := c.items[c.index].Key, c.items[c.index].Value @@ -285,11 +285,9 @@ func (c Cursor) Generate(rand *rand.Rand, size int) reflect.Value { c.items = make([]CursorItem, rand.Intn(size)) for i := range c.items { - value, _ := quick.Value(reflect.TypeOf([]byte(nil)), rand) - c.items[i] = CursorItem{ - Key: u64tob(uint64(rand.Intn(size))), - Value: value.Interface().([]byte), + Key: rand.Int63n(int64(size)), + Value: rand.Int(), } } @@ -310,15 +308,15 @@ func tsdbCursorSlice(a []Cursor) []tsdb.Cursor { // CursorItem represents a key/value pair in a cursor. type CursorItem struct { - Key []byte - Value []byte + Key int64 + Value int } type CursorItems []CursorItem func (a CursorItems) Len() int { return len(a) } func (a CursorItems) Swap(i, j int) { a[i], a[j] = a[j], a[i] } -func (a CursorItems) Less(i, j int) bool { return bytes.Compare(a[i].Key, a[j].Key) == -1 } +func (a CursorItems) Less(i, j int) bool { return a[i].Key < a[j].Key } // byteSlices represents a sortable slice of byte slices. type byteSlices [][]byte diff --git a/tsdb/engine.go b/tsdb/engine.go index fd77da7f54..c8d5946139 100644 --- a/tsdb/engine.go +++ b/tsdb/engine.go @@ -121,10 +121,11 @@ func NewEngineOptions() EngineOptions { type Tx interface { io.WriterTo - Cursor(series string, ascending bool) Cursor Size() int64 Commit() error Rollback() error + + Cursor(series string, fields []string, dec *FieldCodec, ascending bool) Cursor } // DedupeEntries returns slices with unique keys (the first 8 bytes). diff --git a/tsdb/engine/b1/b1.go b/tsdb/engine/b1/b1.go index 3f8aaec313..f8f6fb65bf 100644 --- a/tsdb/engine/b1/b1.go +++ b/tsdb/engine/b1/b1.go @@ -550,26 +550,31 @@ type Tx struct { engine *Engine } -// Cursor returns an iterator for a key. -func (tx *Tx) Cursor(key string, ascending bool) tsdb.Cursor { - // Retrieve key bucket. - b := tx.Bucket([]byte(key)) +// Cursor returns an iterator for a key over a single field. +func (tx *Tx) Cursor(series string, fields []string, dec *tsdb.FieldCodec, ascending bool) tsdb.Cursor { + // Retrieve series bucket. + b := tx.Bucket([]byte(series)) tx.engine.mu.RLock() defer tx.engine.mu.RUnlock() // Ignore if there is no bucket or points in the cache. - partitionID := WALPartition([]byte(key)) - if b == nil && len(tx.engine.cache[partitionID][key]) == 0 { + partitionID := WALPartition([]byte(series)) + if b == nil && len(tx.engine.cache[partitionID][series]) == 0 { return nil } - // Retrieve a copy of the in-cache points for the key. - cache := make([][]byte, len(tx.engine.cache[partitionID][key])) - copy(cache, tx.engine.cache[partitionID][key]) + // Retrieve a copy of the in-cache points for the series. + cache := make([][]byte, len(tx.engine.cache[partitionID][series])) + copy(cache, tx.engine.cache[partitionID][series]) // Build a cursor that merges the bucket and cache together. - cur := &Cursor{cache: cache, ascending: ascending} + cur := &Cursor{ + cache: cache, + fields: fields, + dec: dec, + ascending: ascending, + } if b != nil { cur.cursor = b.Cursor() } @@ -592,6 +597,10 @@ type Cursor struct { key, value []byte } + // Fields and codec. + fields []string + dec *tsdb.FieldCodec + // Cache and current cache index. cache [][]byte index int @@ -606,15 +615,16 @@ type Cursor struct { func (c *Cursor) Ascending() bool { return c.ascending } // Seek moves the cursor to a position and returns the closest key/value pair. -func (c *Cursor) Seek(seek []byte) (key, value []byte) { +func (c *Cursor) Seek(seek int64) (key int64, value interface{}) { // Seek bolt cursor. + seekBytes := u64tob(uint64(seek)) if c.cursor != nil { - c.buf.key, c.buf.value = c.cursor.Seek(seek) + c.buf.key, c.buf.value = c.cursor.Seek(seekBytes) } // Seek cache index. c.index = sort.Search(len(c.cache), func(i int) bool { - return bytes.Compare(c.cache[i][0:8], seek) != -1 + return bytes.Compare(c.cache[i][0:8], seekBytes) != -1 }) // Search will return an index after the length of cache if the seek value is greater @@ -628,28 +638,54 @@ func (c *Cursor) Seek(seek []byte) (key, value []byte) { } // Next returns the next key/value pair from the cursor. -func (c *Cursor) Next() (key, value []byte) { +func (c *Cursor) Next() (key int64, value interface{}) { return c.read() } // read returns the next key/value in the cursor buffer or cache. -func (c *Cursor) read() (key, value []byte) { +func (c *Cursor) read() (key int64, value interface{}) { // Continue skipping ahead through duplicate keys in the cache list. + var k, v []byte for { if c.ascending { - key, value = c.readForward() + k, v = c.readForward() } else { - key, value = c.readReverse() + k, v = c.readReverse() } // Exit loop if we're at the end of the cache or the next key is different. - if key == nil || !bytes.Equal(key, c.prev) { + if k == nil || !bytes.Equal(k, c.prev) { break } } - c.prev = key - return + // Save key so it's not re-read. + c.prev = k + + // Exit if no keys left. + if k == nil { + return tsdb.EOF, nil + } + + // Convert key to timestamp. + key = int64(btou64(k)) + + // Decode fields. Optimize for single field, if possible. + if len(c.fields) == 1 { + decValue, err := c.dec.DecodeByName(c.fields[0], v) + if err != nil { + return key, nil + } + return key, decValue + } else if len(c.fields) > 1 { + m, err := c.dec.DecodeFieldsWithNames(v) + if err != nil { + return key, nil + } + return key, m + } else { + return key, nil + } } // readForward returns the next key/value from the cursor and moves the current location forward. @@ -757,6 +793,9 @@ func u64tob(v uint64) []byte { return b } +// btou64 converts an 8-byte slice to a uint64. +func btou64(b []byte) uint64 { return binary.BigEndian.Uint64(b) } + // byteSlices represents a sortable slice of byte slices. type byteSlices [][]byte diff --git a/tsdb/engine/b1/b1_test.go b/tsdb/engine/b1/b1_test.go index 4589d1c30b..085f55ea75 100644 --- a/tsdb/engine/b1/b1_test.go +++ b/tsdb/engine/b1/b1_test.go @@ -1,7 +1,6 @@ package b1_test import ( - "bytes" "encoding/binary" "io/ioutil" "math" @@ -66,16 +65,14 @@ func TestEngine_WritePoints(t *testing.T) { tx := e.MustBegin(false) defer tx.Rollback() - c := tx.Cursor("temperature", true) - if k, v := c.Seek([]byte{0}); !bytes.Equal(k, u64tob(uint64(time.Unix(1434059627, 0).UnixNano()))) { + c := tx.Cursor("temperature", []string{"value"}, mf.Codec, true) + if k, v := c.Seek(0); k != 1434059627000000000 { t.Fatalf("unexpected key: %#v", k) - } else if m, err := mf.Codec.DecodeFieldsWithNames(v); err != nil { - t.Fatal(err) - } else if m["value"] != float64(200) { - t.Errorf("unexpected value: %#v", m) + } else if v == nil || v.(float64) != 200 { + t.Errorf("unexpected value: %#v", v) } - if k, v := c.Next(); k != nil { + if k, v := c.Next(); k != tsdb.EOF { t.Fatalf("unexpected key/value: %#v / %#v", k, v) } } @@ -131,18 +128,16 @@ func TestEngine_WritePoints_Reverse(t *testing.T) { tx := e.MustBegin(false) defer tx.Rollback() - c := tx.Cursor("temperature", false) - if k, _ := c.Seek(u64tob(math.MaxInt64)); !bytes.Equal(k, u64tob(uint64(time.Unix(1, 0).UnixNano()))) { - t.Fatalf("unexpected key: %v", btou64(k)) - } else if k, v := c.Next(); !bytes.Equal(k, u64tob(uint64(time.Unix(0, 0).UnixNano()))) { - t.Fatalf("unexpected key: %#v", k) - } else if m, err := mf.Codec.DecodeFieldsWithNames(v); err != nil { - t.Fatal(err) - } else if m["value"] != float64(100) { - t.Errorf("unexpected value: %#v", m) + c := tx.Cursor("temperature", []string{"value"}, mf.Codec, false) + if k, _ := c.Seek(math.MaxInt64); k != time.Unix(1, 0).UnixNano() { + t.Fatalf("unexpected key: %v", k) + } else if k, v := c.Next(); k != time.Unix(0, 0).UnixNano() { + t.Fatalf("unexpected key: %v", k) + } else if v == nil || v.(float64) != 100 { + t.Errorf("unexpected value: %#v", v) } - if k, v := c.Next(); k != nil { + if k, v := c.Next(); k != tsdb.EOF { t.Fatalf("unexpected key/value: %#v / %#v", k, v) } } diff --git a/tsdb/engine/bz1/bz1.go b/tsdb/engine/bz1/bz1.go index 7edc9a8291..ba565ecef1 100644 --- a/tsdb/engine/bz1/bz1.go +++ b/tsdb/engine/bz1/bz1.go @@ -74,7 +74,7 @@ type WAL interface { WritePoints(points []models.Point, measurementFieldsToSave map[string]*tsdb.MeasurementFields, seriesToCreate []*tsdb.SeriesCreate) error LoadMetadataIndex(index *tsdb.DatabaseIndex, measurementFields map[string]*tsdb.MeasurementFields) error DeleteSeries(keys []string) error - Cursor(key string, ascending bool) tsdb.Cursor + Cursor(series string, fields []string, dec *tsdb.FieldCodec, ascending bool) tsdb.Cursor Open() error Close() error Flush() error @@ -623,17 +623,19 @@ type Tx struct { } // Cursor returns an iterator for a key. -func (tx *Tx) Cursor(key string, ascending bool) tsdb.Cursor { - walCursor := tx.wal.Cursor(key, ascending) +func (tx *Tx) Cursor(series string, fields []string, dec *tsdb.FieldCodec, ascending bool) tsdb.Cursor { + walCursor := tx.wal.Cursor(series, fields, dec, ascending) // Retrieve points bucket. Ignore if there is no bucket. - b := tx.Bucket([]byte("points")).Bucket([]byte(key)) + b := tx.Bucket([]byte("points")).Bucket([]byte(series)) if b == nil { return walCursor } c := &Cursor{ cursor: b.Cursor(), + fields: fields, + dec: dec, ascending: ascending, } @@ -652,6 +654,9 @@ type Cursor struct { ascending bool fieldIndices []int index int + + fields []string + dec *tsdb.FieldCodec } func (c *Cursor) last() { @@ -662,23 +667,25 @@ func (c *Cursor) last() { func (c *Cursor) Ascending() bool { return c.ascending } // Seek moves the cursor to a position and returns the closest key/value pair. -func (c *Cursor) Seek(seek []byte) (key, value []byte) { +func (c *Cursor) Seek(seek int64) (key int64, value interface{}) { + seekBytes := u64tob(uint64(seek)) + // Move cursor to appropriate block and set to buffer. - k, v := c.cursor.Seek(seek) + k, v := c.cursor.Seek(seekBytes) if v == nil { // get the last block, it might have this time _, v = c.cursor.Last() - } else if bytes.Compare(seek, k) == -1 { // the seek key is less than this block, go back one and check + } else if seek < int64(btou64(k)) { // the seek key is less than this block, go back one and check _, v = c.cursor.Prev() // if the previous block max time is less than the seek value, reset to where we were originally - if v == nil || bytes.Compare(seek, v[0:8]) > 0 { - _, v = c.cursor.Seek(seek) + if v == nil || seek > int64(btou64(v[0:8])) { + _, v = c.cursor.Seek(seekBytes) } } c.setBuf(v) // Read current block up to seek position. - c.seekBuf(seek) + c.seekBuf(seekBytes) // Return current entry. return c.read() @@ -715,10 +722,10 @@ func (c *Cursor) seekBuf(seek []byte) (key, value []byte) { } // Next returns the next key/value pair from the cursor. -func (c *Cursor) Next() (key, value []byte) { +func (c *Cursor) Next() (key int64, value interface{}) { // Ignore if there is no buffer. if len(c.buf) == 0 { - return nil, nil + return tsdb.EOF, nil } if c.ascending { @@ -789,16 +796,17 @@ func (c *Cursor) setBuf(block []byte) { } // read reads the current key and value from the current block. -func (c *Cursor) read() (key, value []byte) { +func (c *Cursor) read() (key int64, value interface{}) { // Return nil if the offset is at the end of the buffer. if c.off >= len(c.buf) { - return nil, nil + return tsdb.EOF, nil } // Otherwise read the current entry. buf := c.buf[c.off:] dataSize := entryDataSize(buf) - return buf[0:8], buf[entryHeaderSize : entryHeaderSize+dataSize] + + return wal.DecodeKeyValue(c.fields, c.dec, buf[0:8], buf[entryHeaderSize:entryHeaderSize+dataSize]) } // MarshalEntry encodes point data into a single byte slice. diff --git a/tsdb/engine/bz1/bz1_test.go b/tsdb/engine/bz1/bz1_test.go index 957ec930af..b2c528ab99 100644 --- a/tsdb/engine/bz1/bz1_test.go +++ b/tsdb/engine/bz1/bz1_test.go @@ -1,39 +1,24 @@ package bz1_test import ( - "bytes" "encoding/binary" "errors" - "fmt" "io/ioutil" "math" - "math/rand" "os" "path/filepath" "reflect" - "sort" - "strconv" + "strings" "testing" - "testing/quick" "time" "github.com/influxdb/influxdb/influxql" "github.com/influxdb/influxdb/models" "github.com/influxdb/influxdb/tsdb" "github.com/influxdb/influxdb/tsdb/engine/bz1" - "github.com/influxdb/influxdb/tsdb/engine/wal" + //"github.com/influxdb/influxdb/tsdb/engine/wal" ) -var QuickConfig quick.Config - -func init() { - // Limit the number of iterations on CI so it doesn't take so long. - if os.Getenv("CI") == "true" { - QuickConfig.MaxCount = 10 - fmt.Fprintf(os.Stderr, "Limiting quickchecks to %d iterations (CI)\n", QuickConfig.MaxCount) - } -} - // Ensure the engine can write series metadata and reload it. func TestEngine_LoadMetadataIndex_Series(t *testing.T) { e := OpenDefaultEngine() @@ -159,14 +144,19 @@ func TestEngine_WriteIndex_Append(t *testing.T) { e := OpenDefaultEngine() defer e.Close() + // Create codec. + codec := tsdb.NewFieldCodec(map[string]*tsdb.Field{ + "value": {ID: uint8(1), Name: "value", Type: influxql.Float}, + }) + // Append points to index. if err := e.WriteIndex(map[string][][]byte{ "cpu": [][]byte{ - append(u64tob(1), 0x10), - append(u64tob(2), 0x20), + append(u64tob(1), MustEncodeFields(codec, tsdb.Fields{"value": float64(10)})...), + append(u64tob(2), MustEncodeFields(codec, tsdb.Fields{"value": float64(20)})...), }, "mem": [][]byte{ - append(u64tob(0), 0x30), + append(u64tob(0), MustEncodeFields(codec, tsdb.Fields{"value": float64(30)})...), }, }, nil, nil); err != nil { t.Fatal(err) @@ -177,20 +167,20 @@ func TestEngine_WriteIndex_Append(t *testing.T) { defer tx.Rollback() // Iterate over "cpu" series. - c := tx.Cursor("cpu", true) - if k, v := c.Seek(u64tob(0)); !reflect.DeepEqual(k, []byte{0, 0, 0, 0, 0, 0, 0, 1}) || !reflect.DeepEqual(v, []byte{0x10}) { + c := tx.Cursor("cpu", []string{"value"}, codec, true) + if k, v := c.Seek(0); k != 1 || v.(float64) != float64(10) { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, v = c.Next(); !reflect.DeepEqual(k, []byte{0, 0, 0, 0, 0, 0, 0, 2}) || !reflect.DeepEqual(v, []byte{0x20}) { + } else if k, v = c.Next(); k != 2 || v.(float64) != float64(20) { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, _ = c.Next(); k != nil { + } else if k, _ = c.Next(); k != tsdb.EOF { t.Fatalf("unexpected key/value: %x / %x", k, v) } // Iterate over "mem" series. - c = tx.Cursor("mem", true) - if k, v := c.Seek(u64tob(0)); !reflect.DeepEqual(k, []byte{0, 0, 0, 0, 0, 0, 0, 0}) || !reflect.DeepEqual(v, []byte{0x30}) { + c = tx.Cursor("mem", []string{"value"}, codec, true) + if k, v := c.Seek(0); k != 0 || v.(float64) != float64(30) { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, _ = c.Next(); k != nil { + } else if k, _ = c.Next(); k != tsdb.EOF { t.Fatalf("unexpected key/value: %x / %x", k, v) } } @@ -200,12 +190,17 @@ func TestEngine_WriteIndex_Insert(t *testing.T) { e := OpenDefaultEngine() defer e.Close() + // Create codec. + codec := tsdb.NewFieldCodec(map[string]*tsdb.Field{ + "value": {ID: uint8(1), Name: "value", Type: influxql.Float}, + }) + // Write initial points to index. if err := e.WriteIndex(map[string][][]byte{ "cpu": [][]byte{ - append(u64tob(10), 0x10), - append(u64tob(20), 0x20), - append(u64tob(30), 0x30), + append(u64tob(10), MustEncodeFields(codec, tsdb.Fields{"value": float64(10)})...), + append(u64tob(20), MustEncodeFields(codec, tsdb.Fields{"value": float64(20)})...), + append(u64tob(30), MustEncodeFields(codec, tsdb.Fields{"value": float64(30)})...), }, }, nil, nil); err != nil { t.Fatal(err) @@ -214,10 +209,10 @@ func TestEngine_WriteIndex_Insert(t *testing.T) { // Write overlapping points to index. if err := e.WriteIndex(map[string][][]byte{ "cpu": [][]byte{ - append(u64tob(9), 0x09), - append(u64tob(10), 0xFF), - append(u64tob(25), 0x25), - append(u64tob(31), 0x31), + append(u64tob(9), MustEncodeFields(codec, tsdb.Fields{"value": float64(9)})...), + append(u64tob(10), MustEncodeFields(codec, tsdb.Fields{"value": float64(255)})...), + append(u64tob(25), MustEncodeFields(codec, tsdb.Fields{"value": float64(25)})...), + append(u64tob(31), MustEncodeFields(codec, tsdb.Fields{"value": float64(31)})...), }, }, nil, nil); err != nil { t.Fatal(err) @@ -226,7 +221,7 @@ func TestEngine_WriteIndex_Insert(t *testing.T) { // Write overlapping points to index again. if err := e.WriteIndex(map[string][][]byte{ "cpu": [][]byte{ - append(u64tob(31), 0xFF), + append(u64tob(31), MustEncodeFields(codec, tsdb.Fields{"value": float64(255)})...), }, }, nil, nil); err != nil { t.Fatal(err) @@ -237,18 +232,18 @@ func TestEngine_WriteIndex_Insert(t *testing.T) { defer tx.Rollback() // Iterate over "cpu" series. - c := tx.Cursor("cpu", true) - if k, v := c.Seek(u64tob(0)); btou64(k) != 9 || !bytes.Equal(v, []byte{0x09}) { + c := tx.Cursor("cpu", []string{"value"}, codec, true) + if k, v := c.Seek(0); k != 9 || v.(float64) != float64(9) { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, v = c.Next(); btou64(k) != 10 || !bytes.Equal(v, []byte{0xFF}) { + } else if k, v = c.Next(); k != 10 || v.(float64) != float64(255) { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, v = c.Next(); btou64(k) != 20 || !bytes.Equal(v, []byte{0x20}) { + } else if k, v = c.Next(); k != 20 || v.(float64) != float64(20) { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, v = c.Next(); btou64(k) != 25 || !bytes.Equal(v, []byte{0x25}) { + } else if k, v = c.Next(); k != 25 || v.(float64) != float64(25) { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, v = c.Next(); btou64(k) != 30 || !bytes.Equal(v, []byte{0x30}) { + } else if k, v = c.Next(); k != 30 || v.(float64) != float64(30) { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, v = c.Next(); btou64(k) != 31 || !bytes.Equal(v, []byte{0xFF}) { + } else if k, v = c.Next(); k != 31 || v.(float64) != float64(255) { t.Fatalf("unexpected key/value: %x / %x", k, v) } } @@ -258,12 +253,17 @@ func TestEngine_Cursor_Reverse(t *testing.T) { e := OpenDefaultEngine() defer e.Close() + // Create codec. + codec := tsdb.NewFieldCodec(map[string]*tsdb.Field{ + "value": {ID: uint8(1), Name: "value", Type: influxql.Float}, + }) + // Write initial points to index. if err := e.WriteIndex(map[string][][]byte{ "cpu": [][]byte{ - append(u64tob(10), 0x10), - append(u64tob(20), 0x20), - append(u64tob(30), 0x30), + append(u64tob(10), MustEncodeFields(codec, tsdb.Fields{"value": float64(10)})...), + append(u64tob(20), MustEncodeFields(codec, tsdb.Fields{"value": float64(20)})...), + append(u64tob(30), MustEncodeFields(codec, tsdb.Fields{"value": float64(30)})...), }, }, nil, nil); err != nil { t.Fatal(err) @@ -272,10 +272,10 @@ func TestEngine_Cursor_Reverse(t *testing.T) { // Write overlapping points to index. if err := e.WriteIndex(map[string][][]byte{ "cpu": [][]byte{ - append(u64tob(9), 0x09), - append(u64tob(10), 0xFF), - append(u64tob(25), 0x25), - append(u64tob(31), 0x31), + append(u64tob(9), MustEncodeFields(codec, tsdb.Fields{"value": float64(9)})...), + append(u64tob(10), MustEncodeFields(codec, tsdb.Fields{"value": float64(255)})...), + append(u64tob(25), MustEncodeFields(codec, tsdb.Fields{"value": float64(25)})...), + append(u64tob(31), MustEncodeFields(codec, tsdb.Fields{"value": float64(31)})...), }, }, nil, nil); err != nil { t.Fatal(err) @@ -284,7 +284,7 @@ func TestEngine_Cursor_Reverse(t *testing.T) { // Write overlapping points to index again. if err := e.WriteIndex(map[string][][]byte{ "cpu": [][]byte{ - append(u64tob(31), 0xFF), + append(u64tob(31), MustEncodeFields(codec, tsdb.Fields{"value": float64(255)})...), }, }, nil, nil); err != nil { t.Fatal(err) @@ -295,18 +295,18 @@ func TestEngine_Cursor_Reverse(t *testing.T) { defer tx.Rollback() // Iterate over "cpu" series. - c := tx.Cursor("cpu", false) - if k, v := c.Seek(u64tob(math.MaxUint64)); btou64(k) != 31 || !bytes.Equal(v, []byte{0xFF}) { + c := tx.Cursor("cpu", []string{"value"}, codec, false) + if k, v := c.Seek(math.MaxInt64); k != 31 || v.(float64) != float64(255) { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, v = c.Next(); btou64(k) != 30 || !bytes.Equal(v, []byte{0x30}) { + } else if k, v = c.Next(); k != 30 || v.(float64) != float64(30) { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, v = c.Next(); btou64(k) != 25 || !bytes.Equal(v, []byte{0x25}) { + } else if k, v = c.Next(); k != 25 || v.(float64) != float64(25) { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, v = c.Next(); btou64(k) != 20 || !bytes.Equal(v, []byte{0x20}) { + } else if k, v = c.Next(); k != 20 || v.(float64) != float64(20) { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, v = c.Next(); btou64(k) != 10 || !bytes.Equal(v, []byte{0xFF}) { + } else if k, v = c.Next(); k != 10 || v.(float64) != float64(255) { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, v = c.Seek(u64tob(0)); btou64(k) != 9 || !bytes.Equal(v, []byte{0x09}) { + } else if k, v = c.Seek(0); k != 9 || v.(float64) != float64(9) { t.Fatalf("unexpected key/value: %x / %x", k, v) } } @@ -316,16 +316,22 @@ func TestEngine_WriteIndex_SeekAgainstInBlockValue(t *testing.T) { e := OpenDefaultEngine() defer e.Close() + // Create codec. + codec := tsdb.NewFieldCodec(map[string]*tsdb.Field{ + "value": {ID: uint8(1), Name: "value", Type: influxql.String}, + }) + // make sure we have data split across two blocks dataSize := (bz1.DefaultBlockSize - 16) / 2 - data := make([]byte, dataSize, dataSize) + data := strings.Repeat("*", dataSize) + // Write initial points to index. if err := e.WriteIndex(map[string][][]byte{ "cpu": [][]byte{ - append(u64tob(10), data...), - append(u64tob(20), data...), - append(u64tob(30), data...), - append(u64tob(40), data...), + append(u64tob(10), MustEncodeFields(codec, tsdb.Fields{"value": data})...), + append(u64tob(20), MustEncodeFields(codec, tsdb.Fields{"value": data})...), + append(u64tob(30), MustEncodeFields(codec, tsdb.Fields{"value": data})...), + append(u64tob(40), MustEncodeFields(codec, tsdb.Fields{"value": data})...), }, }, nil, nil); err != nil { t.Fatal(err) @@ -336,13 +342,13 @@ func TestEngine_WriteIndex_SeekAgainstInBlockValue(t *testing.T) { defer tx.Rollback() // Ensure that we can seek to a block in the middle - c := tx.Cursor("cpu", true) - if k, _ := c.Seek(u64tob(15)); btou64(k) != 20 { - t.Fatalf("expected to seek to time 20, but got %d", btou64(k)) + c := tx.Cursor("cpu", []string{"value"}, codec, true) + if k, _ := c.Seek(15); k != 20 { + t.Fatalf("expected to seek to time 20, but got %d", k) } // Ensure that we can seek to the block on the end - if k, _ := c.Seek(u64tob(35)); btou64(k) != 40 { - t.Fatalf("expected to seek to time 40, but got %d", btou64(k)) + if k, _ := c.Seek(35); k != 40 { + t.Fatalf("expected to seek to time 40, but got %d", k) } } @@ -364,156 +370,6 @@ func TestEngine_WriteIndex_NoPoints(t *testing.T) { } } -// Ensure the engine can accept randomly generated points. -func TestEngine_WriteIndex_Quick(t *testing.T) { - if testing.Short() { - t.Skip("short mode") - } - - quick.Check(func(sets []Points, blockSize uint) bool { - e := OpenDefaultEngine() - e.BlockSize = int(blockSize % 1024) // 1KB max block size - defer e.Close() - - // Write points to index in multiple sets. - for _, set := range sets { - if err := e.WriteIndex(map[string][][]byte(set), nil, nil); err != nil { - t.Fatal(err) - } - } - - // Merge all points together. - points := MergePoints(sets) - - // Retrieve a sorted list of keys so results are deterministic. - keys := points.Keys() - - // Start transaction to read index. - tx := e.MustBegin(false) - defer tx.Rollback() - - // Iterate over results to ensure they are correct. - for _, key := range keys { - c := tx.Cursor(key, true) - - // Read list of key/values. - var got [][]byte - for k, v := c.Seek(u64tob(0)); k != nil; k, v = c.Next() { - got = append(got, append(copyBytes(k), v...)) - } - - if !reflect.DeepEqual(got, points[key]) { - t.Fatalf("points: block size=%d, key=%s:\n\ngot=%x\n\nexp=%x\n\n", e.BlockSize, key, got, points[key]) - } - } - - return true - }, &QuickConfig) -} - -// Ensure the engine can accept randomly generated append-only points. -func TestEngine_WriteIndex_Quick_Append(t *testing.T) { - if testing.Short() { - t.Skip("short mode") - } - - quick.Check(func(sets appendPointSets, blockSize uint) bool { - e := OpenDefaultEngine() - e.BlockSize = int(blockSize % 1024) // 1KB max block size - defer e.Close() - - // Write points to index in multiple sets. - for _, set := range sets { - if err := e.WriteIndex(map[string][][]byte(set), nil, nil); err != nil { - t.Fatal(err) - } - } - - // Merge all points together. - points := MergePoints([]Points(sets)) - - // Retrieve a sorted list of keys so results are deterministic. - keys := points.Keys() - - // Start transaction to read index. - tx := e.MustBegin(false) - defer tx.Rollback() - - // Iterate over results to ensure they are correct. - for _, key := range keys { - c := tx.Cursor(key, true) - - // Read list of key/values. - var got [][]byte - for k, v := c.Seek(u64tob(0)); k != nil; k, v = c.Next() { - got = append(got, append(copyBytes(k), v...)) - } - - if !reflect.DeepEqual(got, points[key]) { - t.Fatalf("points: block size=%d, key=%s:\n\ngot=%x\n\nexp=%x\n\n", e.BlockSize, key, got, points[key]) - } - } - - return true - }, &QuickConfig) -} - -func BenchmarkEngine_WriteIndex_512b(b *testing.B) { benchmarkEngine_WriteIndex(b, 512) } -func BenchmarkEngine_WriteIndex_1KB(b *testing.B) { benchmarkEngine_WriteIndex(b, 1*1024) } -func BenchmarkEngine_WriteIndex_4KB(b *testing.B) { benchmarkEngine_WriteIndex(b, 4*1024) } -func BenchmarkEngine_WriteIndex_16KB(b *testing.B) { benchmarkEngine_WriteIndex(b, 16*1024) } -func BenchmarkEngine_WriteIndex_32KB(b *testing.B) { benchmarkEngine_WriteIndex(b, 32*1024) } -func BenchmarkEngine_WriteIndex_64KB(b *testing.B) { benchmarkEngine_WriteIndex(b, 64*1024) } -func BenchmarkEngine_WriteIndex_128KB(b *testing.B) { benchmarkEngine_WriteIndex(b, 128*1024) } -func BenchmarkEngine_WriteIndex_256KB(b *testing.B) { benchmarkEngine_WriteIndex(b, 256*1024) } - -func benchmarkEngine_WriteIndex(b *testing.B, blockSize int) { - // Skip small iterations. - if b.N < 1000000 { - return - } - - // Create a simple engine. - e := OpenDefaultEngine() - e.BlockSize = blockSize - defer e.Close() - - // Create codec. - codec := tsdb.NewFieldCodec(map[string]*tsdb.Field{ - "value": { - ID: uint8(1), - Name: "value", - Type: influxql.Float, - }, - }) - - // Generate points. - a := make(map[string][][]byte) - a["cpu"] = make([][]byte, b.N) - for i := 0; i < b.N; i++ { - a["cpu"][i] = wal.MarshalEntry(int64(i), MustEncodeFields(codec, models.Fields{"value": float64(i)})) - } - - b.ResetTimer() - - // Insert into engine. - if err := e.WriteIndex(a, nil, nil); err != nil { - b.Fatal(err) - } - - // Calculate on-disk size per point. - bs, _ := e.SeriesBucketStats("cpu") - stats, err := e.Stats() - if err != nil { - b.Fatal(err) - } - b.Logf("pts=%9d bytes/pt=%4.01f leaf-util=%3.0f%%", - b.N, - float64(stats.Size)/float64(b.N), - (float64(bs.LeafInuse)/float64(bs.LeafAlloc))*100.0, - ) -} - // Engine represents a test wrapper for bz1.Engine. type Engine struct { *bz1.Engine @@ -583,7 +439,7 @@ func (w *EnginePointsWriter) Open() error { return nil } func (w *EnginePointsWriter) Close() error { return nil } -func (w *EnginePointsWriter) Cursor(key string, ascending bool) tsdb.Cursor { +func (w *EnginePointsWriter) Cursor(series string, fields []string, dec *tsdb.FieldCodec, ascending bool) tsdb.Cursor { return &Cursor{ascending: ascending} } @@ -596,83 +452,9 @@ type Cursor struct { func (c *Cursor) Ascending() bool { return c.ascending } -func (c *Cursor) Seek(key []byte) ([]byte, []byte) { return nil, nil } +func (c *Cursor) Seek(key int64) (int64, interface{}) { return tsdb.EOF, nil } -func (c *Cursor) Next() ([]byte, []byte) { return nil, nil } - -// Points represents a set of encoded points by key. Implements quick.Generator. -type Points map[string][][]byte - -// Keys returns a sorted list of keys. -func (m Points) Keys() []string { - var keys []string - for k := range m { - keys = append(keys, k) - } - sort.Strings(keys) - return keys -} - -func (Points) Generate(rand *rand.Rand, size int) reflect.Value { - return reflect.ValueOf(Points(GeneratePoints(rand, size, - rand.Intn(size), - func(_ int) time.Time { return time.Unix(0, 0).Add(time.Duration(rand.Intn(100))) }, - ))) -} - -// appendPointSets represents sets of sequential points. Implements quick.Generator. -type appendPointSets []Points - -func (appendPointSets) Generate(rand *rand.Rand, size int) reflect.Value { - sets := make([]Points, 0) - for i, n := 0, rand.Intn(size); i < n; i++ { - sets = append(sets, GeneratePoints(rand, size, - rand.Intn(size), - func(j int) time.Time { - return time.Unix(0, 0).Add((time.Duration(i) * time.Second) + (time.Duration(j) * time.Nanosecond)) - }, - )) - } - return reflect.ValueOf(appendPointSets(sets)) -} - -func GeneratePoints(rand *rand.Rand, size, seriesN int, timestampFn func(int) time.Time) Points { - // Generate series with a random number of points in each. - m := make(Points) - for i := 0; i < seriesN; i++ { - key := strconv.Itoa(i) - - // Generate points for the series. - for j, pointN := 0, rand.Intn(size); j < pointN; j++ { - timestamp := timestampFn(j) - data, ok := quick.Value(reflect.TypeOf([]byte(nil)), rand) - if !ok { - panic("cannot generate data") - } - m[key] = append(m[key], bz1.MarshalEntry(timestamp.UnixNano(), data.Interface().([]byte))) - } - } - return m -} - -// MergePoints returns a map of all points merged together by key. -// Later points will overwrite earlier ones. -func MergePoints(a []Points) Points { - // Combine all points into one set. - m := make(Points) - for _, set := range a { - for key, values := range set { - m[key] = append(m[key], values...) - } - } - - // Dedupe points. - for key, values := range m { - m[key] = tsdb.DedupeEntries(values) - } - - return m -} +func (c *Cursor) Next() (int64, interface{}) { return tsdb.EOF, nil } // MustEncodeFields encodes fields with codec. Panic on error. func MustEncodeFields(codec *tsdb.FieldCodec, fields models.Fields) []byte { diff --git a/tsdb/engine/wal/wal.go b/tsdb/engine/wal/wal.go index bd939a7bb4..11ba0136e1 100644 --- a/tsdb/engine/wal/wal.go +++ b/tsdb/engine/wal/wal.go @@ -255,10 +255,10 @@ func (l *Log) DiskSize() (int64, error) { } // Cursor will return a cursor object to Seek and iterate with Next for the WAL cache for the given -func (l *Log) Cursor(key string, ascending bool) tsdb.Cursor { +func (l *Log) Cursor(series string, fields []string, dec *tsdb.FieldCodec, ascending bool) tsdb.Cursor { l.mu.RLock() defer l.mu.RUnlock() - return l.partition.cursor(key, ascending) + return l.partition.cursor(series, fields, dec, ascending) } func (l *Log) WritePoints(points []models.Point, fields map[string]*tsdb.MeasurementFields, series []*tsdb.SeriesCreate) error { @@ -1214,11 +1214,11 @@ func (p *Partition) addToCache(key, data []byte, timestamp int64) { } // cursor will combine the in memory cache and flush cache (if a flush is currently happening) to give a single ordered cursor for the key -func (p *Partition) cursor(key string, ascending bool) *cursor { +func (p *Partition) cursor(series string, fields []string, dec *tsdb.FieldCodec, ascending bool) *cursor { p.mu.Lock() defer p.mu.Unlock() - entry := p.cache[key] + entry := p.cache[series] if entry == nil { entry = &cacheEntry{} } @@ -1226,13 +1226,13 @@ func (p *Partition) cursor(key string, ascending bool) *cursor { // if we're in the middle of a flush, combine the previous cache // with this one for the cursor if p.flushCache != nil { - if fc, ok := p.flushCache[key]; ok { + if fc, ok := p.flushCache[series]; ok { c := make([][]byte, len(fc), len(fc)+len(entry.points)) copy(c, fc) c = append(c, entry.points...) dedupe := tsdb.DedupeEntries(c) - return newCursor(dedupe, ascending) + return newCursor(dedupe, fields, dec, ascending) } } @@ -1241,10 +1241,11 @@ func (p *Partition) cursor(key string, ascending bool) *cursor { entry.isDirtySort = false } - // build a copy so modifications to the partition don't change the result set + // Build a copy so modifications to the partition don't change the result set a := make([][]byte, len(entry.points)) copy(a, entry.points) - return newCursor(a, ascending) + + return newCursor(a, fields, dec, ascending) } // idFromFileName parses the segment file ID from its name @@ -1408,15 +1409,20 @@ type cursor struct { cache [][]byte position int ascending bool + + fields []string + dec *tsdb.FieldCodec } -func newCursor(cache [][]byte, ascending bool) *cursor { +func newCursor(cache [][]byte, fields []string, dec *tsdb.FieldCodec, ascending bool) *cursor { // position is set such that a call to Next will successfully advance // to the next postion and return the value. c := &cursor{ cache: cache, ascending: ascending, position: -1, + fields: fields, + dec: dec, } if !ascending { c.position = len(c.cache) @@ -1427,10 +1433,12 @@ func newCursor(cache [][]byte, ascending bool) *cursor { func (c *cursor) Ascending() bool { return c.ascending } // Seek will point the cursor to the given time (or key) -func (c *cursor) Seek(seek []byte) (key, value []byte) { +func (c *cursor) Seek(seek int64) (key int64, value interface{}) { + seekBytes := u64tob(uint64(seek)) + // Seek cache index c.position = sort.Search(len(c.cache), func(i int) bool { - return bytes.Compare(c.cache[i][0:8], seek) != -1 + return bytes.Compare(c.cache[i][0:8], seekBytes) != -1 }) // If seek is not in the cache, return the last value in the cache @@ -1440,20 +1448,20 @@ func (c *cursor) Seek(seek []byte) (key, value []byte) { // Make sure our position points to something in the cache if c.position < 0 || c.position >= len(c.cache) { - return nil, nil + return tsdb.EOF, nil } v := c.cache[c.position] if v == nil { - return nil, nil + return tsdb.EOF, nil } - return v[0:8], v[8:] + return DecodeKeyValue(c.fields, c.dec, v[0:8], v[8:]) } // Next moves the cursor to the next key/value. will return nil if at the end -func (c *cursor) Next() (key, value []byte) { +func (c *cursor) Next() (key int64, value interface{}) { var v []byte if c.ascending { v = c.nextForward() @@ -1463,11 +1471,11 @@ func (c *cursor) Next() (key, value []byte) { // Iterated past the end of the cursor if v == nil { - return nil, nil + return tsdb.EOF, nil } // Split v into key/value - return v[0:8], v[8:] + return DecodeKeyValue(c.fields, c.dec, v[0:8], v[8:]) } // nextForward advances the cursor forward returning the next value @@ -1578,3 +1586,27 @@ func u64tob(v uint64) []byte { func btou64(b []byte) uint64 { return binary.BigEndian.Uint64(b) } + +// DecodeKeyValue decodes the key and value from bytes. +func DecodeKeyValue(fields []string, dec *tsdb.FieldCodec, k, v []byte) (key int64, value interface{}) { + // Convert key to a timestamp. + key = int64(btou64(k[0:8])) + + // Decode values. Optimize for single field. + switch len(fields) { + case 0: + return + case 1: + decValue, err := dec.DecodeByName(fields[0], v) + if err != nil { + return + } + return key, decValue + default: + m, err := dec.DecodeFieldsWithNames(v) + if err != nil { + return + } + return key, m + } +} diff --git a/tsdb/engine/wal/wal_test.go b/tsdb/engine/wal/wal_test.go index 03fb4c9e4f..4905fe1fad 100644 --- a/tsdb/engine/wal/wal_test.go +++ b/tsdb/engine/wal/wal_test.go @@ -2,7 +2,6 @@ package wal import ( "bytes" - "encoding/binary" "fmt" "io/ioutil" "math/rand" @@ -33,7 +32,7 @@ func TestWAL_WritePoints(t *testing.T) { }, }) - // test that we can write to two different series + // Test that we can write to two different series p1 := parsePoint("cpu,host=A value=23.2 1", codec) p2 := parsePoint("cpu,host=A value=25.3 4", codec) p3 := parsePoint("cpu,host=B value=1.0 1", codec) @@ -41,27 +40,27 @@ func TestWAL_WritePoints(t *testing.T) { t.Fatalf("failed to write points: %s", err.Error()) } - c := log.Cursor("cpu,host=A", true) - k, v := c.Seek(inttob(1)) + c := log.Cursor("cpu,host=A", []string{"value"}, codec, true) + k, v := c.Seek(1) // ensure the series are there and points are in order - if bytes.Compare(v, p1.Data()) != 0 { + if v.(float64) != 23.2 { t.Fatalf("expected to seek to first point but got key and value: %v %v", k, v) } k, v = c.Next() - if bytes.Compare(v, p2.Data()) != 0 { + if v.(float64) != 25.3 { t.Fatalf("expected to seek to first point but got key and value: %v %v", k, v) } k, v = c.Next() - if k != nil { + if k != tsdb.EOF { t.Fatalf("expected nil on last seek: %v %v", k, v) } - c = log.Cursor("cpu,host=B", true) + c = log.Cursor("cpu,host=B", []string{"value"}, codec, true) k, v = c.Next() - if bytes.Compare(v, p3.Data()) != 0 { + if v.(float64) != 1.0 { t.Fatalf("expected to seek to first point but got key and value: %v %v", k, v) } @@ -98,19 +97,16 @@ func TestWAL_WritePoints(t *testing.T) { t.Fatalf("failed to write points: %s", err.Error()) } - c = log.Cursor("cpu,host=A", true) - k, v = c.Next() - if bytes.Compare(v, p6.Data()) != 0 { + c = log.Cursor("cpu,host=A", []string{"value"}, codec, true) + if _, v := c.Next(); v.(float64) != 1.3 { t.Fatal("order wrong, expected p6") } - _, v = c.Next() - if bytes.Compare(v, p4.Data()) != 0 { + if _, v := c.Next(); v.(float64) != 1.0 { t.Fatal("order wrong, expected p6") } - c = log.Cursor("cpu,host=C", true) - _, v = c.Next() - if bytes.Compare(v, p5.Data()) != 0 { + c = log.Cursor("cpu,host=C", []string{"value"}, codec, true) + if _, v := c.Next(); v.(float64) != 1.4 { t.Fatal("order wrong, expected p6") } @@ -156,17 +152,14 @@ func TestWAL_CorruptDataLengthSize(t *testing.T) { t.Fatalf("failed to write points: %s", err.Error()) } - c := log.Cursor("cpu,host=A", true) - _, v := c.Next() - if bytes.Compare(v, p1.Data()) != 0 { + c := log.Cursor("cpu,host=A", []string{"value"}, codec, true) + if _, v := c.Next(); v.(float64) != 23.2 { t.Fatal("p1 value wrong") } - _, v = c.Next() - if bytes.Compare(v, p2.Data()) != 0 { + if _, v := c.Next(); v.(float64) != 25.3 { t.Fatal("p2 value wrong") } - _, v = c.Next() - if v != nil { + if _, v := c.Next(); v != nil { t.Fatal("expected cursor to return nil") } @@ -184,8 +177,7 @@ func TestWAL_CorruptDataLengthSize(t *testing.T) { log.Open() - p := points[0] - if len(p["cpu,host=A"]) != 2 { + if p := points[0]; len(p["cpu,host=A"]) != 2 { t.Fatal("expected two points for cpu,host=A") } @@ -195,9 +187,8 @@ func TestWAL_CorruptDataLengthSize(t *testing.T) { t.Fatalf("failed to write point: %s", err.Error()) } - c = log.Cursor("cpu,host=A", true) - _, v = c.Next() - if bytes.Compare(v, p3.Data()) != 0 { + c = log.Cursor("cpu,host=A", []string{"value"}, codec, true) + if _, v := c.Next(); v.(float64) != 29.2 { t.Fatal("p3 value wrong") } @@ -205,8 +196,7 @@ func TestWAL_CorruptDataLengthSize(t *testing.T) { points = make([]map[string][][]byte, 0) log.Open() - p = points[0] - if len(p["cpu,host=A"]) != 1 { + if p := points[0]; len(p["cpu,host=A"]) != 1 { t.Fatal("expected two points for cpu,host=A") } } @@ -235,17 +225,14 @@ func TestWAL_CorruptDataBlock(t *testing.T) { t.Fatalf("failed to write points: %s", err.Error()) } - c := log.Cursor("cpu,host=A", true) - _, v := c.Next() - if bytes.Compare(v, p1.Data()) != 0 { + c := log.Cursor("cpu,host=A", []string{"value"}, codec, true) + if _, v := c.Next(); v.(float64) != 23.2 { t.Fatal("p1 value wrong") } - _, v = c.Next() - if bytes.Compare(v, p2.Data()) != 0 { + if _, v := c.Next(); v.(float64) != 25.3 { t.Fatal("p2 value wrong") } - _, v = c.Next() - if v != nil { + if _, v := c.Next(); v != nil { t.Fatal("expected cursor to return nil") } @@ -268,9 +255,7 @@ func TestWAL_CorruptDataBlock(t *testing.T) { }} log.Open() - - p := points[0] - if len(p["cpu,host=A"]) != 2 { + if p := points[0]; len(p["cpu,host=A"]) != 2 { t.Fatal("expected two points for cpu,host=A") } @@ -280,9 +265,8 @@ func TestWAL_CorruptDataBlock(t *testing.T) { t.Fatalf("failed to write point: %s", err.Error()) } - c = log.Cursor("cpu,host=A", true) - _, v = c.Next() - if bytes.Compare(v, p3.Data()) != 0 { + c = log.Cursor("cpu,host=A", []string{"value"}, codec, true) + if _, v := c.Next(); v.(float64) != 29.2 { t.Fatal("p3 value wrong", p3.Data(), v) } @@ -290,8 +274,7 @@ func TestWAL_CorruptDataBlock(t *testing.T) { points = make([]map[string][][]byte, 0) log.Open() - p = points[0] - if len(p["cpu,host=A"]) != 1 { + if p := points[0]; len(p["cpu,host=A"]) != 1 { t.Fatal("expected two points for cpu,host=A") } } @@ -341,9 +324,9 @@ func TestWAL_CompactAfterTimeWithoutWrite(t *testing.T) { } // ensure we have some data - c := log.Cursor("cpu,host=A,region=uswest10", true) + c := log.Cursor("cpu,host=A,region=uswest10", []string{"value"}, codec, true) k, _ := c.Next() - if btou64(k) != 1 { + if k != 1 { t.Fatalf("expected first data point but got one with key: %v", k) } @@ -524,13 +507,13 @@ func TestWAL_DeleteSeries(t *testing.T) { } // ensure data is there - c := log.Cursor("cpu,host=A", true) - if k, _ := c.Next(); btou64(k) != 1 { + c := log.Cursor("cpu,host=A", []string{"value"}, codec, true) + if k, _ := c.Next(); k != 1 { t.Fatal("expected data point for cpu,host=A") } - c = log.Cursor("cpu,host=B", true) - if k, _ := c.Next(); btou64(k) != 2 { + c = log.Cursor("cpu,host=B", []string{"value"}, codec, true) + if k, _ := c.Next(); k != 2 { t.Fatal("expected data point for cpu,host=B") } @@ -546,14 +529,14 @@ func TestWAL_DeleteSeries(t *testing.T) { if len(points["cpu,host=B"]) != 0 { t.Fatal("expected cpu,host=B to have no points in index") } - c = log.Cursor("cpu,host=A", true) - if k, _ := c.Next(); k != nil { + c = log.Cursor("cpu,host=A", []string{"value"}, codec, true) + if k, _ := c.Next(); k != tsdb.EOF { t.Fatal("expected data to be out of the cache cpu,host=A") } // ensure series is deleted - c = log.Cursor("cpu,host=B", true) - if k, _ := c.Next(); k != nil { + c = log.Cursor("cpu,host=B", []string{"value"}, codec, true) + if k, _ := c.Next(); k != tsdb.EOF { t.Fatal("expected no data for cpu,host=B") } @@ -618,10 +601,10 @@ func TestWAL_QueryDuringCompaction(t *testing.T) { } verify := func() { - c := log.Cursor("cpu,host=A", true) - k, v := c.Seek(inttob(1)) + c := log.Cursor("cpu,host=A", []string{"value"}, codec, true) + k, v := c.Seek(1) // ensure the series are there and points are in order - if bytes.Compare(v, p1.Data()) != 0 { + if v.(float64) != 23.2 { <-finishCompaction t.Fatalf("expected to seek to first point but got key and value: %v %v", k, v) } @@ -664,21 +647,17 @@ func TestWAL_PointsSorted(t *testing.T) { t.Fatalf("failed to write points: %s", err.Error()) } - c := log.Cursor("cpu,host=A", true) - k, _ := c.Next() - if btou64(k) != 1 { + c := log.Cursor("cpu,host=A", []string{"value"}, codec, true) + if k, _ := c.Next(); k != 1 { t.Fatal("points out of order") } - k, _ = c.Next() - if btou64(k) != 2 { + if k, _ := c.Next(); k != 2 { t.Fatal("points out of order") } - k, _ = c.Next() - if btou64(k) != 4 { + if k, _ := c.Next(); k != 4 { t.Fatal("points out of order") } - k, _ = c.Next() - if btou64(k) != 6 { + if k, _ := c.Next(); k != 6 { t.Fatal("points out of order") } } @@ -709,21 +688,18 @@ func TestWAL_Cursor_Reverse(t *testing.T) { t.Fatalf("failed to write points: %s", err.Error()) } - c := log.Cursor("cpu,host=A", false) + c := log.Cursor("cpu,host=A", []string{"value"}, codec, false) k, _ := c.Next() - if btou64(k) != 6 { + if k != 6 { t.Fatal("points out of order") } - k, _ = c.Next() - if btou64(k) != 4 { + if k, _ := c.Next(); k != 4 { t.Fatal("points out of order") } - k, _ = c.Next() - if btou64(k) != 2 { + if k, _ := c.Next(); k != 2 { t.Fatal("points out of order") } - k, _ = c.Next() - if btou64(k) != 1 { + if k, _ := c.Next(); k != 1 { t.Fatal("points out of order") } } @@ -762,9 +738,3 @@ func parsePoints(buf string, codec *tsdb.FieldCodec) []models.Point { func parsePoint(buf string, codec *tsdb.FieldCodec) models.Point { return parsePoints(buf, codec)[0] } - -func inttob(v int) []byte { - b := make([]byte, 8) - binary.BigEndian.PutUint64(b, uint64(v)) - return b -} diff --git a/tsdb/mapper.go b/tsdb/mapper.go index 4b4316c409..7ed0bf5c12 100644 --- a/tsdb/mapper.go +++ b/tsdb/mapper.go @@ -185,35 +185,20 @@ func (m *RawMapper) Open() error { } m.tx = tx - selectFields := newStringSet() - selectTags := newStringSet() - whereFields := newStringSet() + // Collect measurements. + mms := Measurements(m.shard.index.MeasurementsByName(m.stmt.SourceNames())) + m.selectFields = mms.SelectFields(m.stmt) + m.selectTags = mms.SelectTags(m.stmt) + m.whereFields = mms.WhereFields(m.stmt) // Open cursors for each measurement. - for _, src := range m.stmt.Sources { - // Retrieve measurement index reference. Ignore if not exists. - mm := m.shard.index.Measurement(src.(*influxql.Measurement).Name) - if mm == nil { - continue - } - - // Open cursors for measurement. - info, err := m.openMeasurement(mm) - if err != nil { + for _, mm := range mms { + if err := m.openMeasurement(mm); err != nil { return err } - - // Append fields & tags. - selectFields.add(info.SelectFields...) - selectTags.add(info.SelectTags...) - whereFields.add(info.WhereFields...) } - m.selectFields = selectFields.list() - m.selectTags = selectTags.list() - m.whereFields = whereFields.list() - - // Remove cursors if no SELECT fields are present. + // Remove cursors if there are not SELECT fields. if len(m.selectFields) == 0 { m.cursors = nil } @@ -221,41 +206,59 @@ func (m *RawMapper) Open() error { return nil } -func (m *RawMapper) openMeasurement(mm *Measurement) (SelectInfo, error) { - // Validate and return selection info. - info, err := mm.ValidateSelectStatement(m.stmt) - if err != nil { - return info, err +func (m *RawMapper) openMeasurement(mm *Measurement) error { + // Validate that ANY GROUP BY is not a field for the measurement. + if err := mm.ValidateGroupBy(m.stmt); err != nil { + return err } + // Validate the fields and tags asked for exist and keep track of which are in the select vs the where + selectFields := mm.SelectFields(m.stmt) + selectTags := mm.SelectTags(m.stmt) + + // If we only have tags in our select clause we just return + if len(selectFields) == 0 && len(selectTags) > 0 { + return fmt.Errorf("statement must have at least one field in select clause") + } + + // Calculate tag sets and apply SLIMIT/SOFFSET. + tagSets, err := mm.DimensionTagSets(m.stmt) + if err != nil { + return err + } + tagSets = m.stmt.LimitTagSets(tagSets) + // Create all cursors for reading the data from this shard. ascending := m.stmt.TimeAscending() - for _, t := range info.TagSets { - cursors := []*seriesCursor{} + for _, t := range tagSets { + cursors := []*TagsCursor{} for i, key := range t.SeriesKeys { - c := m.tx.Cursor(key, ascending) + c := m.tx.Cursor(key, selectFields, m.shard.FieldCodec(mm.Name), ascending) if c == nil { continue } seriesTags := m.shard.index.TagsForSeries(key) - cm := newSeriesCursor(c, t.Filters[i], seriesTags) + cm := NewTagsCursor(c, t.Filters[i], seriesTags) cursors = append(cursors, cm) } - tsc := NewTagSetCursor(mm.Name, t.Tags, cursors, m.shard.FieldCodec(mm.Name)) + tsc := NewTagSetCursor(mm.Name, t.Tags, cursors) + tsc.SelectFields = m.selectFields + tsc.WhereFields = m.whereFields if ascending { - tsc.SeekTo(m.qmin) + tsc.Init(m.qmin) } else { - tsc.SeekTo(m.qmax) + tsc.Init(m.qmax) } + m.cursors = append(m.cursors, tsc) } sort.Sort(TagSetCursors(m.cursors)) - return info, nil + return nil } // Close closes the mapper. @@ -284,7 +287,7 @@ func (m *RawMapper) NextChunk() (interface{}, error) { cursor := m.cursors[m.cursorIndex] - k, v := cursor.Next(m.qmin, m.qmax, m.selectFields, m.whereFields) + k, v := cursor.Next(m.qmin, m.qmax) if v == nil { // Tagset cursor is empty, move to next one. m.cursorIndex++ @@ -417,66 +420,66 @@ func (m *AggregateMapper) Open() error { } m.tx = tx - selectFields := newStringSet() - selectTags := newStringSet() - whereFields := newStringSet() + // Collect measurements. + mms := Measurements(m.shard.index.MeasurementsByName(m.stmt.SourceNames())) + m.selectFields = mms.SelectFields(m.stmt) + m.selectTags = mms.SelectTags(m.stmt) + m.whereFields = mms.WhereFields(m.stmt) // Open cursors for each measurement. - for _, src := range m.stmt.Sources { - // Retrieve measurement index reference. Ignore if not exists. - mm := m.shard.index.Measurement(src.(*influxql.Measurement).Name) - if mm == nil { - continue - } - - // Open cursors for measurement. - info, err := m.openMeasurement(mm) - if err != nil { + for _, mm := range mms { + if err := m.openMeasurement(mm); err != nil { return err } - - // Append fields & tags. - selectFields.add(info.SelectFields...) - selectTags.add(info.SelectTags...) - whereFields.add(info.WhereFields...) } - m.selectFields = selectFields.list() - m.selectTags = selectTags.list() - m.whereFields = whereFields.list() - return nil } -func (m *AggregateMapper) openMeasurement(mm *Measurement) (SelectInfo, error) { - // Validate and return selection info. - info, err := mm.ValidateSelectStatement(m.stmt) - if err != nil { - return info, err +func (m *AggregateMapper) openMeasurement(mm *Measurement) error { + // Validate that ANY GROUP BY is not a field for the measurement. + if err := mm.ValidateGroupBy(m.stmt); err != nil { + return err } + // Validate the fields and tags asked for exist and keep track of which are in the select vs the where + selectFields := mm.SelectFields(m.stmt) + selectTags := mm.SelectTags(m.stmt) + + // If we only have tags in our select clause we just return + if len(selectFields) == 0 && len(selectTags) > 0 { + return fmt.Errorf("statement must have at least one field in select clause") + } + + // Calculate tag sets and apply SLIMIT/SOFFSET. + tagSets, err := mm.DimensionTagSets(m.stmt) + if err != nil { + return err + } + tagSets = m.stmt.LimitTagSets(tagSets) + // Create all cursors for reading the data from this shard. - for _, t := range info.TagSets { - cursors := []*seriesCursor{} + for _, t := range tagSets { + cursors := []*TagsCursor{} for i, key := range t.SeriesKeys { - c := m.tx.Cursor(key, true) + c := m.tx.Cursor(key, selectFields, m.shard.FieldCodec(mm.Name), true) if c == nil { continue } seriesTags := m.shard.index.TagsForSeries(key) - cursors = append(cursors, newSeriesCursor(c, t.Filters[i], seriesTags)) + cursors = append(cursors, NewTagsCursor(c, t.Filters[i], seriesTags)) } - tsc := NewTagSetCursor(mm.Name, t.Tags, cursors, m.shard.FieldCodec(mm.Name)) - tsc.SeekTo(m.qmin) + tsc := NewTagSetCursor(mm.Name, t.Tags, cursors) + tsc.Init(m.qmin) m.cursors = append(m.cursors, tsc) } sort.Sort(TagSetCursors(m.cursors)) - return info, nil + return nil } // initializeMapFunctions initialize the mapping functions for the mapper. @@ -577,25 +580,28 @@ func (m *AggregateMapper) NextChunk() (interface{}, error) { qmax = m.qmax + 1 } - tsc.pointHeap = newPointHeap() + tsc.heap = newPointHeap() for i := range m.mapFuncs { // Prime the tagset cursor for the start of the interval. This is not ideal, as // it should really calculate the values all in 1 pass, but that would require // changes to the mapper functions, which can come later. // Prime the buffers. for i := 0; i < len(tsc.cursors); i++ { - k, v := tsc.cursors[i].SeekTo(qmin) + k, v := tsc.cursors[i].Seek(qmin) if k == -1 || k > tmax { continue } - p := &pointHeapItem{ + + heap.Push(tsc.heap, &pointHeapItem{ timestamp: k, value: v, cursor: tsc.cursors[i], - } - heap.Push(tsc.pointHeap, p) + }) } + tsc.SelectFields = []string{m.fieldNames[i]} + tsc.WhereFields = m.whereFields + // Execute the map function which walks the entire interval, and aggregates the result. output.Values[0].Value = append( output.Values[0].Value.([]interface{}), @@ -606,9 +612,6 @@ func (m *AggregateMapper) NextChunk() (interface{}, error) { qmin: qmin, qmax: qmax, - - selectFields: []string{m.fieldNames[i]}, - whereFields: m.whereFields, }), ) } @@ -634,18 +637,16 @@ func (m *AggregateMapper) nextInterval() (start, end int64) { // AggregateTagSetCursor wraps a standard tagSetCursor, such that the values it emits are aggregated by intervals. type AggregateTagSetCursor struct { cursor *TagSetCursor + qmin int64 + qmax int64 tmin int64 stmt *influxql.SelectStatement - - qmin, qmax int64 - selectFields []string - whereFields []string } // Next returns the next aggregate value for the cursor. func (a *AggregateTagSetCursor) Next() (time int64, value interface{}) { - return a.cursor.Next(a.qmin, a.qmax, a.selectFields, a.whereFields) + return a.cursor.Next(a.qmin, a.qmax) } // Tags returns the current tags for the cursor diff --git a/tsdb/meta.go b/tsdb/meta.go index 1f3a4dd789..1c3f2d8127 100644 --- a/tsdb/meta.go +++ b/tsdb/meta.go @@ -59,6 +59,20 @@ func (d *DatabaseIndex) Measurement(name string) *Measurement { return d.measurements[name] } +// MeasurementsByName returns a list of measurements. +func (d *DatabaseIndex) MeasurementsByName(names []string) []*Measurement { + d.mu.RLock() + defer d.mu.RUnlock() + + a := make([]*Measurement, 0, len(names)) + for _, name := range names { + if m := d.measurements[name]; m != nil { + a = append(a, m) + } + } + return a +} + // MeasurementSeriesCounts returns the number of measurements and series currently indexed by the database. // Useful for reporting and monitoring. func (d *DatabaseIndex) MeasurementSeriesCounts() (nMeasurements int, nSeries int) { @@ -1039,58 +1053,6 @@ func (m *Measurement) uniqueTagValues(expr influxql.Expr) map[string][]string { return out } -// ValidateSelectStatement validates stmt against m. Also returns a list of fields & tagsets. -func (m *Measurement) ValidateSelectStatement(stmt *influxql.SelectStatement) (SelectInfo, error) { - var info SelectInfo - - // Validate that ANY GROUP BY is not a field for the measurement. - if err := m.ValidateGroupBy(stmt); err != nil { - return info, err - } - - // Validate the fields and tags asked for exist and keep track of which are in the select vs the where - info.SelectFields = m.SelectFields(stmt) - info.SelectTags = m.SelectTags(stmt) - info.WhereFields = m.WhereFields(stmt) - - tagSets, err := m.DimensionTagSets(stmt) - if err != nil { - return info, err - } - info.TagSets = tagSets - - // return &tagSetsAndFields{ - // tagSets: tagSets, - // selectFields: sfs.list(), - // selectTags: sts.list(), - // whereFields: wfs.list(), - // }, nil - - // tagSets := tsf.tagSets - // selectFields.add(tsf.selectFields...) - // selectTags.add(tsf.selectTags...) - // whereFields.add(tsf.whereFields...) - - // If we only have tags in our select clause we just return - if len(info.SelectFields) == 0 && len(info.SelectTags) > 0 { - return info, fmt.Errorf("statement must have at least one field in select clause") - } - - // SLIMIT and SOFFSET the unique series - if stmt.SLimit > 0 || stmt.SOffset > 0 { - if stmt.SOffset > len(info.TagSets) { - info.TagSets = nil - } else { - if stmt.SOffset+stmt.SLimit > len(info.TagSets) { - stmt.SLimit = len(info.TagSets) - stmt.SOffset - } - info.TagSets = info.TagSets[stmt.SOffset : stmt.SOffset+stmt.SLimit] - } - } - - return info, nil -} - // SelectFields returns a list of fields in the SELECT section of stmt. func (m *Measurement) SelectFields(stmt *influxql.SelectStatement) []string { set := newStringSet() @@ -1144,7 +1106,6 @@ func (m *Measurement) DimensionTagSets(stmt *influxql.SelectStatement) ([]*influ } type SelectInfo struct { - TagSets []*influxql.TagSet SelectFields []string SelectTags []string WhereFields []string @@ -1157,6 +1118,45 @@ func (a Measurements) Len() int { return len(a) } func (a Measurements) Less(i, j int) bool { return a[i].Name < a[j].Name } func (a Measurements) Swap(i, j int) { a[i], a[j] = a[j], a[i] } +// SelectFields returns a list of fields in the SELECT section of stmt. +func (a Measurements) SelectFields(stmt *influxql.SelectStatement) []string { + set := newStringSet() + for _, name := range stmt.NamesInSelect() { + for _, m := range a { + if m.HasField(name) { + set.add(name) + } + } + } + return set.list() +} + +// SelectTags returns a list of non-field tags in the SELECT section of stmt. +func (a Measurements) SelectTags(stmt *influxql.SelectStatement) []string { + set := newStringSet() + for _, name := range stmt.NamesInSelect() { + for _, m := range a { + if !m.HasField(name) && m.HasTagKey(name) { + set.add(name) + } + } + } + return set.list() +} + +// WhereFields returns a list of non-"time" fields in the WHERE section of stmt. +func (a Measurements) WhereFields(stmt *influxql.SelectStatement) []string { + set := newStringSet() + for _, name := range stmt.NamesInWhere() { + for _, m := range a { + if name != "time" && m.HasField(name) { + set.add(name) + } + } + } + return set.list() +} + func (a Measurements) intersect(other Measurements) Measurements { l := a r := other From 649663ca15221b03a5b085c82e4639e8915c7114 Mon Sep 17 00:00:00 2001 From: Ben Johnson Date: Mon, 21 Sep 2015 15:25:45 -0600 Subject: [PATCH 5/8] fix tests --- cmd/inspect/main.go | 18 +++++-------- tsdb/cursor.go | 63 +++++++++++++++++---------------------------- tsdb/mapper.go | 20 +++++++------- 3 files changed, 39 insertions(+), 62 deletions(-) diff --git a/cmd/inspect/main.go b/cmd/inspect/main.go index eaae2d8913..4144759b44 100644 --- a/cmd/inspect/main.go +++ b/cmd/inspect/main.go @@ -77,8 +77,7 @@ func main() { for _, key := range series { fieldSummary := []string{} - - cursor := tx.Cursor(key, true) + cursor := tx.Cursor(key, m.FieldNames(), shard.FieldCodec(m.Name), true) // Series doesn't exist in this shard if cursor == nil { @@ -86,21 +85,16 @@ func main() { } // Seek to the beginning - _, value := cursor.Seek([]byte{}) - codec := shard.FieldCodec(m.Name) - if codec != nil { - fields, err := codec.DecodeFieldsWithNames(value) - if err != nil { - fmt.Printf("Failed to decode values: %v", err) - } - + _, fields := cursor.Seek(0) + if fields, ok := fields.(map[string]interface{}); ok { for field, value := range fields { fieldSummary = append(fieldSummary, fmt.Sprintf("%s:%T", field, value)) } sort.Strings(fieldSummary) + + fmt.Fprintf(tw, "%d\t%s\t%s\t%d/%d\t%d [%s]\t%d\n", shardID, db, m.Name, len(tags), tagValues, + len(fields), strings.Join(fieldSummary, ","), len(series)) } - fmt.Fprintf(tw, "%d\t%s\t%s\t%d/%d\t%d [%s]\t%d\n", shardID, db, m.Name, len(tags), tagValues, - len(fields), strings.Join(fieldSummary, ","), len(series)) break } tx.Rollback() diff --git a/tsdb/cursor.go b/tsdb/cursor.go index 9e00e37404..7b3369be90 100644 --- a/tsdb/cursor.go +++ b/tsdb/cursor.go @@ -244,6 +244,30 @@ func (tsc *TagSetCursor) Next(tmin, tmax int64) (int64, interface{}) { continue } + // Filter value. + if p.cursor.filter != nil { + // Convert value to a map for filter evaluation. + m, ok := value.(map[string]interface{}) + if !ok { + m = map[string]interface{}{tsc.SelectFields[0]: value} + } + + // If filter fails then skip to the next value. + if !influxql.EvalBool(p.cursor.filter, m) { + continue + } + } + + // Filter out single field, if specified. + if len(tsc.SelectFields) == 1 { + if m, ok := value.(map[string]interface{}); ok { + value = m[tsc.SelectFields[0]] + } + if value == nil { + continue + } + } + return timestamp, value } } @@ -252,45 +276,6 @@ func (tsc *TagSetCursor) Next(tmin, tmax int64) (int64, interface{}) { // if there is no current currsor, it returns nil func (tsc *TagSetCursor) Tags() map[string]string { return tsc.currentTags } -// decodeRawPoint decodes raw point data into field names & values and does WHERE filtering. -// func (tsc *TagSetCursor) decodeRawPoint(p *pointHeapItem) interface{} { -// if len(tsc.SelectFields) > 1 { -// if fieldsWithNames, err := tsc.decoder.DecodeFieldsWithNames(p.value); err == nil { -// // If there's a where clause, make sure we don't need to filter this value -// if p.cursor.filter != nil && !influxql.EvalBool(p.cursor.filter, fieldsWithNames) { -// return nil -// } - -// return fieldsWithNames -// } -// } - -// // With only 1 field SELECTed, decoding all fields may be avoidable, which is faster. -// value, err := tsc.decoder.DecodeByName(tsc.SelectFields[0], p.value) -// if err != nil { -// return nil -// } - -// // Return value if there's no filter. -// if p.cursor.filter == nil { -// return value -// } - -// // See if the WHERE is only on this field or on one or more other fields. -// // If the latter, we'll have to decode everything -// if len(tsc.WhereFields) == 1 && tsc.WhereFields[0] == tsc.SelectFields[0] { -// if !influxql.EvalBool(p.cursor.filter, map[string]interface{}{tsc.SelectFields[0]: value}) { -// value = nil -// } -// } else { -// fieldsWithNames, err := tsc.decoder.DecodeFieldsWithNames(p.value) -// if err != nil || !influxql.EvalBool(p.cursor.filter, fieldsWithNames) { -// value = nil -// } -// } -// return value -// } - type pointHeapItem struct { timestamp int64 value interface{} diff --git a/tsdb/mapper.go b/tsdb/mapper.go index 7ed0bf5c12..dc0bc00c98 100644 --- a/tsdb/mapper.go +++ b/tsdb/mapper.go @@ -463,7 +463,7 @@ func (m *AggregateMapper) openMeasurement(mm *Measurement) error { cursors := []*TagsCursor{} for i, key := range t.SeriesKeys { - c := m.tx.Cursor(key, selectFields, m.shard.FieldCodec(mm.Name), true) + c := m.tx.Cursor(key, m.fieldNames, m.shard.FieldCodec(mm.Name), true) if c == nil { continue } @@ -603,17 +603,15 @@ func (m *AggregateMapper) NextChunk() (interface{}, error) { tsc.WhereFields = m.whereFields // Execute the map function which walks the entire interval, and aggregates the result. - output.Values[0].Value = append( - output.Values[0].Value.([]interface{}), - m.mapFuncs[i](&AggregateTagSetCursor{ - cursor: tsc, - tmin: tmin, - stmt: m.stmt, + mapValue := m.mapFuncs[i](&AggregateTagSetCursor{ + cursor: tsc, + tmin: tmin, + stmt: m.stmt, - qmin: qmin, - qmax: qmax, - }), - ) + qmin: qmin, + qmax: qmax, + }) + output.Values[0].Value = append(output.Values[0].Value.([]interface{}), mapValue) } return output, nil From 420b8ed3621f952c21401c1c80daee374fd713d5 Mon Sep 17 00:00:00 2001 From: Ben Johnson Date: Mon, 21 Sep 2015 15:25:59 -0600 Subject: [PATCH 6/8] go vet: remove -methods --- .hooks/pre-commit | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.hooks/pre-commit b/.hooks/pre-commit index a12ccac8ac..ba05e8a294 100755 --- a/.hooks/pre-commit +++ b/.hooks/pre-commit @@ -7,7 +7,7 @@ if [ $fmtcount -gt 0 ]; then fi # Due to the way composites work, vet will fail for some of our tests so we ignore it -vetcount=`go tool vet --composites=false ./ 2>&1 | wc -l` +vetcount=`go tool vet --composites=false --methods=false ./ 2>&1 | wc -l` if [ $vetcount -gt 0 ]; then echo "Some files aren't passing vet heuristics, please run 'go vet ./...' to see the errors it flags and correct your source code before committing" exit 1 From 56cb2fae5daec3c953bbe214b1099262440a5d31 Mon Sep 17 00:00:00 2001 From: Ben Johnson Date: Tue, 22 Sep 2015 12:25:24 -0600 Subject: [PATCH 7/8] fix integration tests --- cmd/influxd/run/server_test.go | 2 ++ tsdb/cursor.go | 16 ++++++++-------- tsdb/mapper.go | 25 ++++++++++++++++++++++--- 3 files changed, 32 insertions(+), 11 deletions(-) diff --git a/cmd/influxd/run/server_test.go b/cmd/influxd/run/server_test.go index 6639f378f0..890ab2de46 100644 --- a/cmd/influxd/run/server_test.go +++ b/cmd/influxd/run/server_test.go @@ -2805,6 +2805,7 @@ func TestServer_Query_Wildcards(t *testing.T) { t.Logf("SKIP:: %s", query.name) continue } + if err := query.Execute(s); err != nil { t.Error(query.Error(err)) } else if !query.success() { @@ -3181,6 +3182,7 @@ func TestServer_Query_Where_Fields(t *testing.T) { t.Logf("SKIP:: %s", query.name) continue } + if err := query.Execute(s); err != nil { t.Error(query.Error(err)) } else if !query.success() { diff --git a/tsdb/cursor.go b/tsdb/cursor.go index 7b3369be90..b70229d029 100644 --- a/tsdb/cursor.go +++ b/tsdb/cursor.go @@ -38,7 +38,7 @@ type multiCursor struct { } // Seek moves the cursor to a given key. -func (mc *multiCursor) Seek(seek int64) (key int64, value interface{}) { +func (mc *multiCursor) Seek(seek int64) (int64, interface{}) { // Initialize heap. h := make(cursorHeap, 0, len(mc.cursors)) for i, c := range mc.cursors { @@ -73,7 +73,7 @@ func (mc *multiCursor) Ascending() bool { } // Next returns the next key/value from the cursor. -func (mc *multiCursor) Next() (key int64, value interface{}) { return mc.pop() } +func (mc *multiCursor) Next() (int64, interface{}) { return mc.pop() } // pop returns the next item from the heap. // Reads the next key/value from item's cursor and puts it back on the heap. @@ -153,8 +153,8 @@ type TagSetCursor struct { cursors []*TagsCursor // Underlying tags cursors. currentTags map[string]string // the current tags for the underlying series cursor in play - SelectFields []string - WhereFields []string + SelectFields []string // fields to be selected + Fields []string // fields to be selected or filtered // Min-heap of cursors ordered by timestamp. heap *pointHeap @@ -336,7 +336,7 @@ func NewTagsCursor(c Cursor, filter influxql.Expr, tags map[string]string) *Tags } // Seek positions returning the key and value at that key. -func (c *TagsCursor) Seek(seek int64) (key int64, value interface{}) { +func (c *TagsCursor) Seek(seek int64) (int64, interface{}) { // We've seeked on this cursor. This seek is after that previous cached seek // and the result it gave was after the key for this seek. // @@ -347,16 +347,16 @@ func (c *TagsCursor) Seek(seek int64) (key int64, value interface{}) { } // Seek to key/value in underlying cursor. - key, value = c.cursor.Seek(seek) + key, value := c.cursor.Seek(seek) // Save the seek to the buffer. c.seek = seek c.buf.key, c.buf.value = key, value - return + return key, value } // Next returns the next timestamp and value from the cursor. -func (c *TagsCursor) Next() (key int64, value interface{}) { +func (c *TagsCursor) Next() (int64, interface{}) { // Invalidate the seek. c.seek = -1 c.buf.key, c.buf.value = 0, nil diff --git a/tsdb/mapper.go b/tsdb/mapper.go index dc0bc00c98..f2306c3fae 100644 --- a/tsdb/mapper.go +++ b/tsdb/mapper.go @@ -215,6 +215,7 @@ func (m *RawMapper) openMeasurement(mm *Measurement) error { // Validate the fields and tags asked for exist and keep track of which are in the select vs the where selectFields := mm.SelectFields(m.stmt) selectTags := mm.SelectTags(m.stmt) + fields := uniqueStrings(m.selectFields, m.whereFields) // If we only have tags in our select clause we just return if len(selectFields) == 0 && len(selectTags) > 0 { @@ -234,7 +235,7 @@ func (m *RawMapper) openMeasurement(mm *Measurement) error { cursors := []*TagsCursor{} for i, key := range t.SeriesKeys { - c := m.tx.Cursor(key, selectFields, m.shard.FieldCodec(mm.Name), ascending) + c := m.tx.Cursor(key, fields, m.shard.FieldCodec(mm.Name), ascending) if c == nil { continue } @@ -246,7 +247,7 @@ func (m *RawMapper) openMeasurement(mm *Measurement) error { tsc := NewTagSetCursor(mm.Name, t.Tags, cursors) tsc.SelectFields = m.selectFields - tsc.WhereFields = m.whereFields + tsc.Fields = fields if ascending { tsc.Init(m.qmin) } else { @@ -600,7 +601,7 @@ func (m *AggregateMapper) NextChunk() (interface{}, error) { } tsc.SelectFields = []string{m.fieldNames[i]} - tsc.WhereFields = m.whereFields + tsc.Fields = uniqueStrings([]string{m.fieldNames[i]}, m.whereFields) // Execute the map function which walks the entire interval, and aggregates the result. mapValue := m.mapFuncs[i](&AggregateTagSetCursor{ @@ -660,3 +661,21 @@ func (a *AggregateTagSetCursor) TMin() int64 { } return -1 } + +// uniqueStrings returns a slice of unique strings from all lists in a. +func uniqueStrings(a ...[]string) []string { + // Calculate unique set of strings. + m := make(map[string]struct{}) + for _, strs := range a { + for _, str := range strs { + m[str] = struct{}{} + } + } + + // Convert back to slice. + result := make([]string, 0, len(m)) + for k := range m { + result = append(result, k) + } + return result +} From 96715d7d9022c792d7623d5616ac7bc4bf322ae0 Mon Sep 17 00:00:00 2001 From: Ben Johnson Date: Tue, 22 Sep 2015 13:20:53 -0600 Subject: [PATCH 8/8] rename Cursor.Seek() to Cursor.SeekTo() --- .hooks/pre-commit | 2 +- CHANGELOG.md | 1 + cmd/inspect/main.go | 2 +- tsdb/cursor.go | 12 +++---- tsdb/cursor_test.go | 16 +++++----- tsdb/engine/b1/b1.go | 2 +- tsdb/engine/b1/b1_test.go | 4 +-- tsdb/engine/bz1/bz1.go | 2 +- tsdb/engine/bz1/bz1_test.go | 63 ++++++++++++++++++------------------- tsdb/engine/wal/wal.go | 2 +- tsdb/engine/wal/wal_test.go | 4 +-- tsdb/mapper.go | 2 +- 12 files changed, 56 insertions(+), 56 deletions(-) diff --git a/.hooks/pre-commit b/.hooks/pre-commit index ba05e8a294..a12ccac8ac 100755 --- a/.hooks/pre-commit +++ b/.hooks/pre-commit @@ -7,7 +7,7 @@ if [ $fmtcount -gt 0 ]; then fi # Due to the way composites work, vet will fail for some of our tests so we ignore it -vetcount=`go tool vet --composites=false --methods=false ./ 2>&1 | wc -l` +vetcount=`go tool vet --composites=false ./ 2>&1 | wc -l` if [ $vetcount -gt 0 ]; then echo "Some files aren't passing vet heuristics, please run 'go vet ./...' to see the errors it flags and correct your source code before committing" exit 1 diff --git a/CHANGELOG.md b/CHANGELOG.md index 97f2a5c787..c187ea223d 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -16,6 +16,7 @@ - [#4165](https://github.com/influxdb/influxdb/pull/4165): Tag all Go runtime stats when writing to internal database. - [#4118](https://github.com/influxdb/influxdb/issues/4118): Return consistent, correct result for SHOW MEASUREMENTS with multiple AND conditions - [#4191](https://github.com/influxdb/influxdb/pull/4191): Correctly marshal remote mapper responses. Fixes [#4170](https://github.com/influxdb/influxdb/issues/4170) +- [#4180](https://github.com/influxdb/influxdb/pull/4180): Cursor & SelectMapper Refactor ## v0.9.4 [2015-09-14] diff --git a/cmd/inspect/main.go b/cmd/inspect/main.go index 4144759b44..f299fee1c9 100644 --- a/cmd/inspect/main.go +++ b/cmd/inspect/main.go @@ -85,7 +85,7 @@ func main() { } // Seek to the beginning - _, fields := cursor.Seek(0) + _, fields := cursor.SeekTo(0) if fields, ok := fields.(map[string]interface{}); ok { for field, value := range fields { fieldSummary = append(fieldSummary, fmt.Sprintf("%s:%T", field, value)) diff --git a/tsdb/cursor.go b/tsdb/cursor.go index b70229d029..e533e7705e 100644 --- a/tsdb/cursor.go +++ b/tsdb/cursor.go @@ -14,7 +14,7 @@ const EOF = int64(-1) // Cursor represents an iterator over a series. type Cursor interface { - Seek(seek int64) (key int64, value interface{}) + SeekTo(seek int64) (key int64, value interface{}) Next() (key int64, value interface{}) Ascending() bool } @@ -38,12 +38,12 @@ type multiCursor struct { } // Seek moves the cursor to a given key. -func (mc *multiCursor) Seek(seek int64) (int64, interface{}) { +func (mc *multiCursor) SeekTo(seek int64) (int64, interface{}) { // Initialize heap. h := make(cursorHeap, 0, len(mc.cursors)) for i, c := range mc.cursors { // Move cursor to position. Skip if it's empty. - k, v := c.Seek(seek) + k, v := c.SeekTo(seek) if k == EOF { continue } @@ -189,7 +189,7 @@ func (tsc *TagSetCursor) Init(seek int64) { // Prime the buffers. for i := 0; i < len(tsc.cursors); i++ { - k, v := tsc.cursors[i].Seek(seek) + k, v := tsc.cursors[i].SeekTo(seek) if k == EOF { k, v = tsc.cursors[i].Next() } @@ -336,7 +336,7 @@ func NewTagsCursor(c Cursor, filter influxql.Expr, tags map[string]string) *Tags } // Seek positions returning the key and value at that key. -func (c *TagsCursor) Seek(seek int64) (int64, interface{}) { +func (c *TagsCursor) SeekTo(seek int64) (int64, interface{}) { // We've seeked on this cursor. This seek is after that previous cached seek // and the result it gave was after the key for this seek. // @@ -347,7 +347,7 @@ func (c *TagsCursor) Seek(seek int64) (int64, interface{}) { } // Seek to key/value in underlying cursor. - key, value := c.cursor.Seek(seek) + key, value := c.cursor.SeekTo(seek) // Save the seek to the buffer. c.seek = seek diff --git a/tsdb/cursor_test.go b/tsdb/cursor_test.go index 55965162e3..b5505f2c4c 100644 --- a/tsdb/cursor_test.go +++ b/tsdb/cursor_test.go @@ -20,7 +20,7 @@ func TestMultiCursor_Single(t *testing.T) { {Key: 2, Value: 20}, }, true)) - if k, v := mc.Seek(0); k != 0 || v.(int) != 0 { + if k, v := mc.SeekTo(0); k != 0 || v.(int) != 0 { t.Fatalf("unexpected key/value: %x / %x", k, v) } else if k, v = mc.Next(); k != 1 || v.(int) != 10 { t.Fatalf("unexpected key/value: %x / %x", k, v) @@ -39,7 +39,7 @@ func TestMultiCursor_Single_Reverse(t *testing.T) { {Key: 2, Value: 20}, }, false)) - if k, v := mc.Seek(2); k != 2 || v.(int) != 20 { + if k, v := mc.SeekTo(2); k != 2 || v.(int) != 20 { t.Fatalf("unexpected key/value: %x / %x", k, v) } else if k, v = mc.Next(); k != 1 || v.(int) != 10 { t.Fatalf("unexpected key/value: %x / %x", k, v) @@ -64,7 +64,7 @@ func TestMultiCursor_Multiple_NonOverlapping(t *testing.T) { }, true), ) - if k, v := mc.Seek(0); k != 0 || v.(int) != 0 { + if k, v := mc.SeekTo(0); k != 0 || v.(int) != 0 { t.Fatalf("unexpected key/value: %x / %x", k, v) } else if k, v = mc.Next(); k != 1 || v.(int) != 10 { t.Fatalf("unexpected key/value: %x / %x", k, v) @@ -93,7 +93,7 @@ func TestMultiCursor_Multiple_NonOverlapping_Reverse(t *testing.T) { }, false), ) - if k, v := mc.Seek(4); k != 4 || v.(int) != 40 { + if k, v := mc.SeekTo(4); k != 4 || v.(int) != 40 { t.Fatalf("unexpected key/value: %x / %x", k, v) } else if k, v = mc.Next(); k != 3 || v.(int) != 30 { t.Fatalf("unexpected key/value: %x / %x", k, v) @@ -123,7 +123,7 @@ func TestMultiCursor_Multiple_Overlapping(t *testing.T) { }, true), ) - if k, v := mc.Seek(0); k != 0 || v.(int) != 0 { + if k, v := mc.SeekTo(0); k != 0 || v.(int) != 0 { t.Fatalf("unexpected key/value: %x / %x", k, v) } else if k, v = mc.Next(); k != 2 || v.(int) != 0xF2 { t.Fatalf("unexpected key/value: %x / %x", k, v) @@ -151,7 +151,7 @@ func TestMultiCursor_Multiple_Overlapping_Reverse(t *testing.T) { }, false), ) - if k, v := mc.Seek(4); k != 4 || v.(int) != 4 { + if k, v := mc.SeekTo(4); k != 4 || v.(int) != 4 { t.Fatalf("unexpected key/value: %x / %x", k, v) } else if k, v = mc.Next(); k != 3 || v.(int) != 3 { t.Fatalf("unexpected key/value: %x / %x", k, v) @@ -193,7 +193,7 @@ func TestMultiCursor_Quick(t *testing.T) { // Create multi-cursor and iterate over all items. mc := tsdb.MultiCursor(tsdbCursorSlice(cursors)...) - for k, v := mc.Seek(seek); k != tsdb.EOF; k, v = mc.Next() { + for k, v := mc.SeekTo(seek); k != tsdb.EOF; k, v = mc.Next() { got = append(got, CursorItem{k, v.(int)}) } @@ -231,7 +231,7 @@ func NewCursor(items []CursorItem, ascending bool) *Cursor { func (c *Cursor) Ascending() bool { return c.ascending } // Seek seeks to an item by key. -func (c *Cursor) Seek(seek int64) (key int64, value interface{}) { +func (c *Cursor) SeekTo(seek int64) (key int64, value interface{}) { if c.ascending { return c.seekForward(seek) } diff --git a/tsdb/engine/b1/b1.go b/tsdb/engine/b1/b1.go index f8f6fb65bf..fdc337b2f7 100644 --- a/tsdb/engine/b1/b1.go +++ b/tsdb/engine/b1/b1.go @@ -615,7 +615,7 @@ type Cursor struct { func (c *Cursor) Ascending() bool { return c.ascending } // Seek moves the cursor to a position and returns the closest key/value pair. -func (c *Cursor) Seek(seek int64) (key int64, value interface{}) { +func (c *Cursor) SeekTo(seek int64) (key int64, value interface{}) { // Seek bolt cursor. seekBytes := u64tob(uint64(seek)) if c.cursor != nil { diff --git a/tsdb/engine/b1/b1_test.go b/tsdb/engine/b1/b1_test.go index 085f55ea75..5c3c19ee3b 100644 --- a/tsdb/engine/b1/b1_test.go +++ b/tsdb/engine/b1/b1_test.go @@ -66,7 +66,7 @@ func TestEngine_WritePoints(t *testing.T) { defer tx.Rollback() c := tx.Cursor("temperature", []string{"value"}, mf.Codec, true) - if k, v := c.Seek(0); k != 1434059627000000000 { + if k, v := c.SeekTo(0); k != 1434059627000000000 { t.Fatalf("unexpected key: %#v", k) } else if v == nil || v.(float64) != 200 { t.Errorf("unexpected value: %#v", v) @@ -129,7 +129,7 @@ func TestEngine_WritePoints_Reverse(t *testing.T) { defer tx.Rollback() c := tx.Cursor("temperature", []string{"value"}, mf.Codec, false) - if k, _ := c.Seek(math.MaxInt64); k != time.Unix(1, 0).UnixNano() { + if k, _ := c.SeekTo(math.MaxInt64); k != time.Unix(1, 0).UnixNano() { t.Fatalf("unexpected key: %v", k) } else if k, v := c.Next(); k != time.Unix(0, 0).UnixNano() { t.Fatalf("unexpected key: %v", k) diff --git a/tsdb/engine/bz1/bz1.go b/tsdb/engine/bz1/bz1.go index ba565ecef1..e4d5682ca4 100644 --- a/tsdb/engine/bz1/bz1.go +++ b/tsdb/engine/bz1/bz1.go @@ -667,7 +667,7 @@ func (c *Cursor) last() { func (c *Cursor) Ascending() bool { return c.ascending } // Seek moves the cursor to a position and returns the closest key/value pair. -func (c *Cursor) Seek(seek int64) (key int64, value interface{}) { +func (c *Cursor) SeekTo(seek int64) (key int64, value interface{}) { seekBytes := u64tob(uint64(seek)) // Move cursor to appropriate block and set to buffer. diff --git a/tsdb/engine/bz1/bz1_test.go b/tsdb/engine/bz1/bz1_test.go index b2c528ab99..97873afe3b 100644 --- a/tsdb/engine/bz1/bz1_test.go +++ b/tsdb/engine/bz1/bz1_test.go @@ -16,7 +16,6 @@ import ( "github.com/influxdb/influxdb/models" "github.com/influxdb/influxdb/tsdb" "github.com/influxdb/influxdb/tsdb/engine/bz1" - //"github.com/influxdb/influxdb/tsdb/engine/wal" ) // Ensure the engine can write series metadata and reload it. @@ -152,11 +151,11 @@ func TestEngine_WriteIndex_Append(t *testing.T) { // Append points to index. if err := e.WriteIndex(map[string][][]byte{ "cpu": [][]byte{ - append(u64tob(1), MustEncodeFields(codec, tsdb.Fields{"value": float64(10)})...), - append(u64tob(2), MustEncodeFields(codec, tsdb.Fields{"value": float64(20)})...), + append(u64tob(1), MustEncodeFields(codec, models.Fields{"value": float64(10)})...), + append(u64tob(2), MustEncodeFields(codec, models.Fields{"value": float64(20)})...), }, "mem": [][]byte{ - append(u64tob(0), MustEncodeFields(codec, tsdb.Fields{"value": float64(30)})...), + append(u64tob(0), MustEncodeFields(codec, models.Fields{"value": float64(30)})...), }, }, nil, nil); err != nil { t.Fatal(err) @@ -168,7 +167,7 @@ func TestEngine_WriteIndex_Append(t *testing.T) { // Iterate over "cpu" series. c := tx.Cursor("cpu", []string{"value"}, codec, true) - if k, v := c.Seek(0); k != 1 || v.(float64) != float64(10) { + if k, v := c.SeekTo(0); k != 1 || v.(float64) != float64(10) { t.Fatalf("unexpected key/value: %x / %x", k, v) } else if k, v = c.Next(); k != 2 || v.(float64) != float64(20) { t.Fatalf("unexpected key/value: %x / %x", k, v) @@ -178,7 +177,7 @@ func TestEngine_WriteIndex_Append(t *testing.T) { // Iterate over "mem" series. c = tx.Cursor("mem", []string{"value"}, codec, true) - if k, v := c.Seek(0); k != 0 || v.(float64) != float64(30) { + if k, v := c.SeekTo(0); k != 0 || v.(float64) != float64(30) { t.Fatalf("unexpected key/value: %x / %x", k, v) } else if k, _ = c.Next(); k != tsdb.EOF { t.Fatalf("unexpected key/value: %x / %x", k, v) @@ -198,9 +197,9 @@ func TestEngine_WriteIndex_Insert(t *testing.T) { // Write initial points to index. if err := e.WriteIndex(map[string][][]byte{ "cpu": [][]byte{ - append(u64tob(10), MustEncodeFields(codec, tsdb.Fields{"value": float64(10)})...), - append(u64tob(20), MustEncodeFields(codec, tsdb.Fields{"value": float64(20)})...), - append(u64tob(30), MustEncodeFields(codec, tsdb.Fields{"value": float64(30)})...), + append(u64tob(10), MustEncodeFields(codec, models.Fields{"value": float64(10)})...), + append(u64tob(20), MustEncodeFields(codec, models.Fields{"value": float64(20)})...), + append(u64tob(30), MustEncodeFields(codec, models.Fields{"value": float64(30)})...), }, }, nil, nil); err != nil { t.Fatal(err) @@ -209,10 +208,10 @@ func TestEngine_WriteIndex_Insert(t *testing.T) { // Write overlapping points to index. if err := e.WriteIndex(map[string][][]byte{ "cpu": [][]byte{ - append(u64tob(9), MustEncodeFields(codec, tsdb.Fields{"value": float64(9)})...), - append(u64tob(10), MustEncodeFields(codec, tsdb.Fields{"value": float64(255)})...), - append(u64tob(25), MustEncodeFields(codec, tsdb.Fields{"value": float64(25)})...), - append(u64tob(31), MustEncodeFields(codec, tsdb.Fields{"value": float64(31)})...), + append(u64tob(9), MustEncodeFields(codec, models.Fields{"value": float64(9)})...), + append(u64tob(10), MustEncodeFields(codec, models.Fields{"value": float64(255)})...), + append(u64tob(25), MustEncodeFields(codec, models.Fields{"value": float64(25)})...), + append(u64tob(31), MustEncodeFields(codec, models.Fields{"value": float64(31)})...), }, }, nil, nil); err != nil { t.Fatal(err) @@ -221,7 +220,7 @@ func TestEngine_WriteIndex_Insert(t *testing.T) { // Write overlapping points to index again. if err := e.WriteIndex(map[string][][]byte{ "cpu": [][]byte{ - append(u64tob(31), MustEncodeFields(codec, tsdb.Fields{"value": float64(255)})...), + append(u64tob(31), MustEncodeFields(codec, models.Fields{"value": float64(255)})...), }, }, nil, nil); err != nil { t.Fatal(err) @@ -233,7 +232,7 @@ func TestEngine_WriteIndex_Insert(t *testing.T) { // Iterate over "cpu" series. c := tx.Cursor("cpu", []string{"value"}, codec, true) - if k, v := c.Seek(0); k != 9 || v.(float64) != float64(9) { + if k, v := c.SeekTo(0); k != 9 || v.(float64) != float64(9) { t.Fatalf("unexpected key/value: %x / %x", k, v) } else if k, v = c.Next(); k != 10 || v.(float64) != float64(255) { t.Fatalf("unexpected key/value: %x / %x", k, v) @@ -261,9 +260,9 @@ func TestEngine_Cursor_Reverse(t *testing.T) { // Write initial points to index. if err := e.WriteIndex(map[string][][]byte{ "cpu": [][]byte{ - append(u64tob(10), MustEncodeFields(codec, tsdb.Fields{"value": float64(10)})...), - append(u64tob(20), MustEncodeFields(codec, tsdb.Fields{"value": float64(20)})...), - append(u64tob(30), MustEncodeFields(codec, tsdb.Fields{"value": float64(30)})...), + append(u64tob(10), MustEncodeFields(codec, models.Fields{"value": float64(10)})...), + append(u64tob(20), MustEncodeFields(codec, models.Fields{"value": float64(20)})...), + append(u64tob(30), MustEncodeFields(codec, models.Fields{"value": float64(30)})...), }, }, nil, nil); err != nil { t.Fatal(err) @@ -272,10 +271,10 @@ func TestEngine_Cursor_Reverse(t *testing.T) { // Write overlapping points to index. if err := e.WriteIndex(map[string][][]byte{ "cpu": [][]byte{ - append(u64tob(9), MustEncodeFields(codec, tsdb.Fields{"value": float64(9)})...), - append(u64tob(10), MustEncodeFields(codec, tsdb.Fields{"value": float64(255)})...), - append(u64tob(25), MustEncodeFields(codec, tsdb.Fields{"value": float64(25)})...), - append(u64tob(31), MustEncodeFields(codec, tsdb.Fields{"value": float64(31)})...), + append(u64tob(9), MustEncodeFields(codec, models.Fields{"value": float64(9)})...), + append(u64tob(10), MustEncodeFields(codec, models.Fields{"value": float64(255)})...), + append(u64tob(25), MustEncodeFields(codec, models.Fields{"value": float64(25)})...), + append(u64tob(31), MustEncodeFields(codec, models.Fields{"value": float64(31)})...), }, }, nil, nil); err != nil { t.Fatal(err) @@ -284,7 +283,7 @@ func TestEngine_Cursor_Reverse(t *testing.T) { // Write overlapping points to index again. if err := e.WriteIndex(map[string][][]byte{ "cpu": [][]byte{ - append(u64tob(31), MustEncodeFields(codec, tsdb.Fields{"value": float64(255)})...), + append(u64tob(31), MustEncodeFields(codec, models.Fields{"value": float64(255)})...), }, }, nil, nil); err != nil { t.Fatal(err) @@ -296,7 +295,7 @@ func TestEngine_Cursor_Reverse(t *testing.T) { // Iterate over "cpu" series. c := tx.Cursor("cpu", []string{"value"}, codec, false) - if k, v := c.Seek(math.MaxInt64); k != 31 || v.(float64) != float64(255) { + if k, v := c.SeekTo(math.MaxInt64); k != 31 || v.(float64) != float64(255) { t.Fatalf("unexpected key/value: %x / %x", k, v) } else if k, v = c.Next(); k != 30 || v.(float64) != float64(30) { t.Fatalf("unexpected key/value: %x / %x", k, v) @@ -306,7 +305,7 @@ func TestEngine_Cursor_Reverse(t *testing.T) { t.Fatalf("unexpected key/value: %x / %x", k, v) } else if k, v = c.Next(); k != 10 || v.(float64) != float64(255) { t.Fatalf("unexpected key/value: %x / %x", k, v) - } else if k, v = c.Seek(0); k != 9 || v.(float64) != float64(9) { + } else if k, v = c.SeekTo(0); k != 9 || v.(float64) != float64(9) { t.Fatalf("unexpected key/value: %x / %x", k, v) } } @@ -328,10 +327,10 @@ func TestEngine_WriteIndex_SeekAgainstInBlockValue(t *testing.T) { // Write initial points to index. if err := e.WriteIndex(map[string][][]byte{ "cpu": [][]byte{ - append(u64tob(10), MustEncodeFields(codec, tsdb.Fields{"value": data})...), - append(u64tob(20), MustEncodeFields(codec, tsdb.Fields{"value": data})...), - append(u64tob(30), MustEncodeFields(codec, tsdb.Fields{"value": data})...), - append(u64tob(40), MustEncodeFields(codec, tsdb.Fields{"value": data})...), + append(u64tob(10), MustEncodeFields(codec, models.Fields{"value": data})...), + append(u64tob(20), MustEncodeFields(codec, models.Fields{"value": data})...), + append(u64tob(30), MustEncodeFields(codec, models.Fields{"value": data})...), + append(u64tob(40), MustEncodeFields(codec, models.Fields{"value": data})...), }, }, nil, nil); err != nil { t.Fatal(err) @@ -343,11 +342,11 @@ func TestEngine_WriteIndex_SeekAgainstInBlockValue(t *testing.T) { // Ensure that we can seek to a block in the middle c := tx.Cursor("cpu", []string{"value"}, codec, true) - if k, _ := c.Seek(15); k != 20 { + if k, _ := c.SeekTo(15); k != 20 { t.Fatalf("expected to seek to time 20, but got %d", k) } // Ensure that we can seek to the block on the end - if k, _ := c.Seek(35); k != 40 { + if k, _ := c.SeekTo(35); k != 40 { t.Fatalf("expected to seek to time 40, but got %d", k) } } @@ -452,7 +451,7 @@ type Cursor struct { func (c *Cursor) Ascending() bool { return c.ascending } -func (c *Cursor) Seek(key int64) (int64, interface{}) { return tsdb.EOF, nil } +func (c *Cursor) SeekTo(key int64) (int64, interface{}) { return tsdb.EOF, nil } func (c *Cursor) Next() (int64, interface{}) { return tsdb.EOF, nil } diff --git a/tsdb/engine/wal/wal.go b/tsdb/engine/wal/wal.go index 11ba0136e1..0bec6c2a39 100644 --- a/tsdb/engine/wal/wal.go +++ b/tsdb/engine/wal/wal.go @@ -1433,7 +1433,7 @@ func newCursor(cache [][]byte, fields []string, dec *tsdb.FieldCodec, ascending func (c *cursor) Ascending() bool { return c.ascending } // Seek will point the cursor to the given time (or key) -func (c *cursor) Seek(seek int64) (key int64, value interface{}) { +func (c *cursor) SeekTo(seek int64) (key int64, value interface{}) { seekBytes := u64tob(uint64(seek)) // Seek cache index diff --git a/tsdb/engine/wal/wal_test.go b/tsdb/engine/wal/wal_test.go index 4905fe1fad..9c425782ff 100644 --- a/tsdb/engine/wal/wal_test.go +++ b/tsdb/engine/wal/wal_test.go @@ -41,7 +41,7 @@ func TestWAL_WritePoints(t *testing.T) { } c := log.Cursor("cpu,host=A", []string{"value"}, codec, true) - k, v := c.Seek(1) + k, v := c.SeekTo(1) // ensure the series are there and points are in order if v.(float64) != 23.2 { @@ -602,7 +602,7 @@ func TestWAL_QueryDuringCompaction(t *testing.T) { verify := func() { c := log.Cursor("cpu,host=A", []string{"value"}, codec, true) - k, v := c.Seek(1) + k, v := c.SeekTo(1) // ensure the series are there and points are in order if v.(float64) != 23.2 { <-finishCompaction diff --git a/tsdb/mapper.go b/tsdb/mapper.go index f2306c3fae..84cc2e63f7 100644 --- a/tsdb/mapper.go +++ b/tsdb/mapper.go @@ -588,7 +588,7 @@ func (m *AggregateMapper) NextChunk() (interface{}, error) { // changes to the mapper functions, which can come later. // Prime the buffers. for i := 0; i < len(tsc.cursors); i++ { - k, v := tsc.cursors[i].Seek(qmin) + k, v := tsc.cursors[i].SeekTo(qmin) if k == -1 || k > tmax { continue }