influxdb/shard.go

package influxdb
import (
"bytes"
"encoding/binary"
"errors"
"fmt"
"math"
"time"
"code.google.com/p/goprotobuf/proto"
"code.google.com/p/log4go"
"github.com/boltdb/bolt"
"github.com/influxdb/influxdb/engine"
"github.com/influxdb/influxdb/parser"
"github.com/influxdb/influxdb/protocol"
)
// Shard represents the physical storage for a given time range.
type Shard struct {
ID uint64 `json:"id,omitempty"`
StartTime time.Time `json:"startTime,omitempty"`
EndTime time.Time `json:"endTime,omitempty"`
store *bolt.DB
}
// newShard returns a new initialized Shard instance.
func newShard() *Shard { return &Shard{} }
// Duration returns the duration between the shard's start and end time.
func (s *Shard) Duration() time.Duration { return s.EndTime.Sub(s.StartTime) }
// open initializes and opens the shard's store.
func (s *Shard) open(path string) error {
// Return an error if the shard is already open.
if s.store != nil {
return errors.New("shard already open")
}
// Open store on shard.
store, err := bolt.Open(path, 0600, &bolt.Options{Timeout: 1 * time.Second})
if err != nil {
return err
}
s.store = store
// Initialize store.
if err := s.init(); err != nil {
_ = s.close()
return fmt.Errorf("init: %s", err)
}
return nil
}
// init creates top-level buckets in the datastore.
func (s *Shard) init() error {
return s.store.Update(func(tx *bolt.Tx) error {
_, err := tx.CreateBucketIfNotExists([]byte("values"))
return err
})
}
// close shuts down the shard's store.
func (s *Shard) close() error {
return s.store.Close()
}
// writeSeries writes series data to the shard.
func (s *Shard) writeSeries(series *protocol.Series) error {
assert(len(series.GetFieldIds()) > 0, "field ids required for write")
return s.store.Update(func(tx *bolt.Tx) error {
b := tx.Bucket([]byte("values"))
for i, fieldID := range series.FieldIds {
for _, p := range series.Points {
// Convert the storage key to a byte slice.
k := marshalStorageKey(newStorageKey(fieldID, p.GetTimestamp(), p.GetSequenceNumber()))
// If value is null then delete it.
if p.Values[i].GetIsNull() {
if err := b.Delete(k); err != nil {
return fmt.Errorf("del: %s", err)
}
continue
}
// Marshal the value via protobuf.
buf := proto.NewBuffer(nil)
if err := buf.Marshal(p.Values[i]); err != nil {
return err
}
// Write to the bucket.
if err := b.Put(k, buf.Bytes()); err != nil {
return fmt.Errorf("put: %s", err)
}
}
}
return nil
})
}
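// readValueExample is an illustrative sketch, not part of the original
// file: it shows how a single field value written by writeSeries could be
// read back, by looking up its storage key in the "values" bucket and
// unmarshaling the protobuf-encoded FieldValue. The function name and
// error text are hypothetical.
func (s *Shard) readValueExample(fieldID uint64, timestamp int64, seq uint64) (*protocol.FieldValue, error) {
	fv := &protocol.FieldValue{}
	err := s.store.View(func(tx *bolt.Tx) error {
		// Build the same 24-byte key layout that writeSeries uses.
		k := marshalStorageKey(newStorageKey(fieldID, timestamp, seq))
		v := tx.Bucket([]byte("values")).Get(k)
		if v == nil {
			return fmt.Errorf("value not found")
		}
		return proto.Unmarshal(v, fv)
	})
	if err != nil {
		return nil, err
	}
	return fv, nil
}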
func (s *Shard) deleteSeries(name string) error {
panic("not yet implemented") // TODO
}
// query executes a query against the shard and returns results to a channel.
func (s *Shard) query(spec *parser.QuerySpec, name string, fields []*Field, resp chan<- *protocol.Response) {
log4go.Debug("QUERY: shard %d, query '%s'", s.ID, spec.GetQueryStringWithTimeCondition())
defer recoverFunc(spec.Database(), spec.GetQueryStringWithTimeCondition(), func(err interface{}) {
resp <- &protocol.Response{
Type: protocol.Response_ERROR.Enum(),
ErrorMessage: protocol.String(fmt.Sprintf("%s", err)),
}
})
var err error
var p engine.Processor
p = NewResponseChannelProcessor(NewResponseChannelWrapper(resp))
p = NewShardIdInserterProcessor(s.ID, p)
if p, err = s.processor(spec, p); err != nil {
resp <- &protocol.Response{
Type: protocol.Response_ERROR.Enum(),
ErrorMessage: protocol.String(err.Error()),
}
log4go.Error("error while creating engine: %s", err)
return
}
log4go.Info("processor chain: %s\n", engine.ProcessorChain(p))
// Execute by type of query.
switch t := spec.SelectQuery().FromClause.Type; t {
case parser.FromClauseArray:
log4go.Debug("shard %s: running a regular query")
err = s.executeArrayQuery(spec, name, fields, p)
// TODO
//case parser.FromClauseMerge, parser.FromClauseInnerJoin:
// log4go.Debug("shard %s: running a merge query")
// err = s.executeMergeQuery(querySpec, processor, t)
default:
panic(fmt.Errorf("unknown from clause type %s", t))
}
if err != nil {
resp <- &protocol.Response{
Type: protocol.Response_ERROR.Enum(),
ErrorMessage: protocol.String(err.Error()),
}
return
}
_ = p.Close()
resp <- &protocol.Response{Type: protocol.Response_END_STREAM.Enum()}
}
func (s *Shard) processor(spec *parser.QuerySpec, p engine.Processor) (engine.Processor, error) {
// If the query can be aggregated locally, do so at the shard level.
q := spec.SelectQuery()
if spec.CanAggregateLocally(s.Duration()) {
log4go.Debug("creating a query engine")
var err error
if p, err = engine.NewQueryEngine(p, q, nil); err != nil {
return nil, err
}
if q != nil && q.GetFromClause().Type != parser.FromClauseInnerJoin {
p = engine.NewFilteringEngine(q, p)
}
return p, nil
}
// We shouldn't limit queries that have aggregates but aren't
// aggregated locally; otherwise the aggregation, which happens in
// the coordinator, would operate on partial data and produce
// incorrect results.
if q.HasAggregates() {
log4go.Debug("creating a passthrough engine")
p = engine.NewPassthroughEngine(p, 1000)
if q != nil && q.GetFromClause().Type != parser.FromClauseInnerJoin {
p = engine.NewFilteringEngine(q, p)
}
return p, nil
}
// This is an optimization so we don't send more data than we should
// over the wire. The coordinator has its own passthrough engine
// which applies the final limit.
if q.Limit > 0 {
log4go.Debug("creating a passthrough engine with limit")
p = engine.NewPassthroughEngineWithLimit(p, 1000, q.Limit)
}
return p, nil
}
func (s *Shard) executeArrayQuery(spec *parser.QuerySpec, name string, fields []*Field, processor engine.Processor) error {
fnames := Fields(fields).Names()
aliases := spec.SelectQuery().GetTableAliases(name)
// Create a new iterator.
i, err := s.iterator(fields)
if err != nil {
return fmt.Errorf("iterator: %s", err)
}
defer func() { _ = i.close() }()
i.startTime = spec.GetStartTime()
i.endTime = spec.GetEndTime()
i.ascending = spec.SelectQuery().Ascending
// Iterate over each point and yield to the processor for each alias.
for p := i.first(); p != nil; p = i.next() {
for _, alias := range aliases {
series := &protocol.Series{
Name: proto.String(alias),
Fields: fnames,
Points: []*protocol.Point{p},
}
log4go.Debug("Yielding to %s %s", processor.Name(), series)
if ok, err := processor.Yield(series); err != nil {
log4go.Error("Error while processing data: %v", err)
return err
} else if !ok {
log4go.Debug("Stopping processing.")
// NOTE: This doesn't stop processing.
}
}
}
log4go.Debug("Finished running query %s", spec.GetQueryString())
return nil
}
// iterator returns a new iterator for a set of fields.
func (s *Shard) iterator(fields []*Field) (*iterator, error) {
// Open a read-only transaction.
// This transaction must be closed separately by the iterator.
tx, err := s.store.Begin(false)
if err != nil {
return nil, err
}
// Initialize cursor.
i := &iterator{
tx: tx,
fields: fields,
cursors: make([]*bolt.Cursor, len(fields)),
values: make([]rawValue, len(fields)),
}
// Open a cursor for each field.
for j := range fields {
i.cursors[j] = tx.Bucket([]byte("values")).Cursor()
}
return i, nil
}
// Shards represents a list of shards.
type Shards []*Shard
// IDs returns a slice of all shard ids.
func (p Shards) IDs() []uint64 {
ids := make([]uint64, len(p))
for i, s := range p {
ids[i] = s.ID
}
return ids
}
// shardsAsc represents a list of shards, sortable in ascending order.
type shardsAsc []*Shard
func (p shardsAsc) Len() int { return len(p) }
func (p shardsAsc) Less(i, j int) bool { return p[i].StartTime.Before(p[j].StartTime) }
func (p shardsAsc) Swap(i, j int) { p[i], p[j] = p[j], p[i] }
// shardsDesc represents a list of shards, sortable in descending order.
type shardsDesc []*Shard
func (p shardsDesc) Len() int { return len(p) }
func (p shardsDesc) Less(i, j int) bool { return p[i].StartTime.After(p[j].StartTime) }
func (p shardsDesc) Swap(i, j int) { p[i], p[j] = p[j], p[i] }
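// Usage sketch (illustrative, not part of the original file), assuming the
// standard library "sort" package is imported:
//
//	sort.Sort(shardsAsc(shards))  // earliest StartTime first
//	sort.Sort(shardsDesc(shards)) // latest StartTime first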
// storageKey is the key that we use to store values in our key/value
// store engine. The key contains the field id, timestamp and sequence
// number of the value being stored.
type storageKey struct {
bytesBuf []byte
id uint64
timestamp int64
seq uint64
}
// newStorageKey returns a new storageKey.
// The timestamp is in microseconds and may be negative.
func newStorageKey(id uint64, timestamp int64, seq uint64) storageKey {
return storageKey{
bytesBuf: nil,
id: id,
timestamp: timestamp,
seq: seq,
}
}
// unmarshalStorageKey parses the given byte slice into a storageKey.
func unmarshalStorageKey(b []byte) (storageKey, error) {
if len(b) != 8*3 {
return storageKey{}, fmt.Errorf("expected %d bytes, found %d", 8*3, len(b))
}
sk := storageKey{}
buf := bytes.NewBuffer(b)
binary.Read(buf, binary.BigEndian, &sk.id)
var t uint64
binary.Read(buf, binary.BigEndian, &t)
sk.timestamp = convertUintTimestampToInt64(t)
binary.Read(buf, binary.BigEndian, &sk.seq)
sk.bytesBuf = b
return sk, nil
}
// mustUnmarshalStorageKey parses a storage key and panics if it cannot be parsed.
func mustUnmarshalStorageKey(b []byte) storageKey {
sk, err := unmarshalStorageKey(b)
if err != nil {
panic(err)
}
return sk
}
// marshalStorageKey converts a storage key to a byte slice. If the key
// already carries a marshaled byte slice (e.g. one set by
// unmarshalStorageKey), that cached slice is returned directly. Note
// that sk is passed by value, so the cache written below does not
// propagate back to the caller's copy.
func marshalStorageKey(sk storageKey) []byte {
if sk.bytesBuf != nil {
return sk.bytesBuf
}
buf := bytes.NewBuffer(nil)
binary.Write(buf, binary.BigEndian, sk.id)
binary.Write(buf, binary.BigEndian, convertTimestampToUint(sk.timestamp))
binary.Write(buf, binary.BigEndian, sk.seq)
// Cache the marshaled key on the local copy of sk.
sk.bytesBuf = buf.Bytes()
return sk.bytesBuf
}
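// keyLayoutExample is an illustrative sketch, not part of the original
// file: it prints the fixed 24-byte big-endian layout produced by
// marshalStorageKey (8 bytes field id, 8 bytes biased timestamp, 8 bytes
// sequence number). Big-endian encoding makes bolt's lexicographic key
// comparison equivalent to ordering by (id, timestamp, seq).
func keyLayoutExample() {
	k := marshalStorageKey(newStorageKey(1, 1415070958000000, 2))
	fmt.Printf("len=%d id=% x ts=% x seq=% x\n", len(k), k[0:8], k[8:16], k[16:24])
}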
func (sk storageKey) time() time.Time {
return time.Unix(0, sk.timestamp*int64(time.Microsecond))
}
func convertTimestampToUint(t int64) uint64 {
if t < 0 {
return uint64(math.MaxInt64 + t + 1)
}
return uint64(t) + uint64(math.MaxInt64) + uint64(1)
}
func convertUintTimestampToInt64(t uint64) int64 {
if t > uint64(math.MaxInt64) {
return int64(t-math.MaxInt64) - int64(1)
}
return int64(t) - math.MaxInt64 - int64(1)
}
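// timestampBiasExample is an illustrative sketch, not part of the original
// file: it demonstrates that the bias above maps the full int64 range onto
// uint64 so that unsigned (and therefore byte-wise big-endian) comparison
// preserves timestamp order, and that the conversion round-trips exactly.
func timestampBiasExample() {
	for _, t := range []int64{math.MinInt64, -1, 0, 1, math.MaxInt64} {
		u := convertTimestampToUint(t)
		fmt.Printf("%d -> %d -> %d\n", t, u, convertUintTimestampToInt64(u))
	}
}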
// iterator combines a set of field cursors into a point iterator,
// i.e. an iterator that yields whole points instead of individual
// column values.
type iterator struct {
tx *bolt.Tx
cursors []*bolt.Cursor
fields []*Field
values []rawValue
startTime time.Time
endTime time.Time
ascending bool
valid bool
err error
point *protocol.Point
}
// close closes the read transaction and clears the cursors.
func (i *iterator) close() (err error) {
err = i.tx.Rollback()
i.tx = nil
i.cursors = nil
return
}
// first moves the iterator to the first point.
func (i *iterator) first() *protocol.Point {
i.valid = false
for j, c := range i.cursors {
// Seek to the first key at or after the start time for this field.
// Storage key timestamps are in microseconds, so convert from the
// nanosecond resolution of time.Time.
k, v := c.Seek(marshalStorageKey(newStorageKey(i.fields[j].ID, i.startTime.UnixNano()/int64(time.Microsecond), 0)))
if k == nil {
continue
}
sk := mustUnmarshalStorageKey(k)
if sk.id != i.fields[j].ID {
log4go.Debug("first: different id reached")
continue
} else if sk.time().Before(i.startTime) || sk.time().After(i.endTime) {
log4go.Debug("first: outside time range: %s, %s", sk.time(), i.startTime)
continue
}
// Set the value for the field.
i.values[j] = rawValue{time: sk.timestamp, sequence: sk.seq, value: v}
}
return i.materialize()
}
// next moves the iterator to the next point.
func (i *iterator) next() *protocol.Point {
i.valid = false
// Move the cursors to the next value.
for j, c := range i.cursors {
// Ignore cursors which already have a value.
if i.values[j].value != nil {
continue
}
// Read next key/value.
k, v := c.Next()
if k == nil {
continue
}
// Move to the next iterator if different field reached.
// Move to the next iterator if outside of time range.
sk := mustUnmarshalStorageKey(k)
if sk.id != i.fields[j].ID {
log4go.Debug("different id reached")
continue
} else if sk.time().Before(i.startTime) || sk.time().After(i.endTime) {
log4go.Debug("Outside time range: %s, %s", sk.time(), i.startTime)
continue
}
// Set the value for the field.
i.values[j] = rawValue{time: sk.timestamp, sequence: sk.seq, value: v}
log4go.Debug("Iterator next value: %v", i.values[j])
}
return i.materialize()
}
// materialize creates a point from the current values and moves the cursors forward.
func (i *iterator) materialize() *protocol.Point {
// Choose the lowest (for ascending queries) or highest (for descending
// queries) timestamp and sequence number. That will become the
// timestamp and sequence of the next point.
var next *rawValue
for j, value := range i.values {
// Ignore nil values.
if value.value == nil {
continue
}
// Initialize next value if not set.
// Otherwise override next if value is before (ASC) or after (DESC).
if next == nil {
next = &i.values[j]
} else if i.ascending && value.before(next) {
next = &i.values[j]
} else if !i.ascending && value.after(next) {
next = &i.values[j]
}
}
// Set values to point that match the timestamp & sequence number.
buf := proto.NewBuffer(nil)
point := &protocol.Point{Values: make([]*protocol.FieldValue, len(i.fields))}
for j, c := range i.cursors {
value := &i.values[j]
log4go.Debug("Column value: %s", value)
// Skip value if it doesn't match point's timestamp and seq number.
if value.value == nil || value.time != next.time || value.sequence != next.sequence {
trueValue := true
point.Values[j] = &protocol.FieldValue{IsNull: &trueValue}
continue
}
// Iterator is valid if at least one column is set.
log4go.Debug("Setting is valid to true")
i.valid = true
// Advance the iterator to read a new value in the next iteration
if i.ascending {
c.Next()
} else {
c.Prev()
}
// Marshal value from protobufs into point.
fv := &protocol.FieldValue{}
buf.SetBuf(value.value)
if err := buf.Unmarshal(fv); err != nil {
log4go.Error("Error while running query: %s", err)
i.err, i.valid = err, false
return nil
}
point.Values[j] = fv
value.value = nil
}
// This will only happen if there are no points for the given series
// and range, and this is the first call to next(). Otherwise we only
// call next() on a valid iterator, so we know we have more points.
if next == nil {
return nil
}
// Set timestamp and sequence number on point.
point.SetTimestampInMicroseconds(next.time)
point.SequenceNumber = proto.Uint64(next.sequence)
return point
}
// rawValue represents the value for a field at a given time and sequence id.
type rawValue struct {
time int64
sequence uint64
value []byte
}
// before returns true if the value is before another value.
func (v rawValue) before(other *rawValue) bool {
return (v.time < other.time) || (v.time == other.time && v.sequence < other.sequence)
}
// after returns true if the value is after another value.
func (v rawValue) after(other *rawValue) bool {
return (v.time > other.time) || (v.time == other.time && v.sequence > other.sequence)
}
func (v rawValue) String() string {
return fmt.Sprintf("[time: %d, sequence: %d, value: %v]", v.time, v.sequence, v.value)
}
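// rawValueOrderingExample is an illustrative sketch, not part of the
// original file: raw values order by timestamp first and sequence number
// second, which is how materialize deterministically picks the next point
// when multiple fields have values at the same timestamp.
func rawValueOrderingExample() {
	a := rawValue{time: 10, sequence: 1}
	b := rawValue{time: 10, sequence: 2}
	fmt.Println(a.before(&b), b.after(&a)) // prints: true true
}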