influxdb/query/execute/executor.go

// Package execute contains the implementation of the execution phase in the query engine.
package execute

import (
	"context"
	"fmt"
	"runtime/debug"
	"time"

	"github.com/influxdata/platform"
	"github.com/influxdata/platform/query"
	"github.com/influxdata/platform/query/plan"
	"github.com/pkg/errors"
	"go.uber.org/zap"
	"go.uber.org/zap/zapcore"
)

// Executor executes a query plan and returns the results it produces.
type Executor interface {
	// Execute runs the plan p for the organization orgID using the allocator a.
	// The implementation in this file returns one entry per result declared in
	// the plan, keyed by the result's name.
	Execute(ctx context.Context, orgID platform.ID, p *plan.PlanSpec, a *Allocator) (map[string]query.Result, error)
}

// executor is the Executor implementation returned by NewExecutor.
type executor struct {
	// deps is copied into every executionState and exposed to nodes through
	// executionContext.Dependencies.
	deps   Dependencies
	// logger is handed to the dispatcher and to each executionState.
	// NewExecutor guarantees it is non-nil.
	logger *zap.Logger
}

// NewExecutor returns an Executor that hands deps to every execution and logs
// through logger. A nil logger is replaced with a no-op logger.
func NewExecutor(deps Dependencies, logger *zap.Logger) Executor {
	log := logger
	if log == nil {
		log = zap.NewNop()
	}
	return &executor{deps: deps, logger: log}
}

// streamContext carries the time bounds associated with a single node of the
// execution graph. createNode builds one per procedure from the procedure's
// bounds.
type streamContext struct {
	bounds Bounds
}

// newStreamContext returns a streamContext holding the bounds b.
func newStreamContext(b Bounds) streamContext {
	var sc streamContext
	sc.bounds = b
	return sc
}

// Bounds returns the bounds the stream context was created with.
func (sc streamContext) Bounds() Bounds {
	return sc.bounds
}

// executionState holds everything needed to run a single plan: the plan
// itself, the graph pieces built from it by createNode, and the dispatcher
// that drives the transports.
type executionState struct {
	// p is the plan being executed; its Now field is the reference used when
	// resolving times.
	p    *plan.PlanSpec
	// deps are the dependencies copied from the executor.
	deps Dependencies

	// orgID is the organization the plan is executed for.
	orgID platform.ID

	// alloc is the allocator supplied by the caller; its Limit is set from the
	// plan's memory quota in createExecutionState.
	alloc *Allocator

	// resources is a copy of the plan's resource settings; do passes its
	// ConcurrencyQuota to the dispatcher.
	resources query.ResourceManagement

	// results maps each result name in the plan to its result.
	results map[string]query.Result
	// sources are the source nodes created by createNode; do runs each one in
	// its own goroutine.
	sources []Source

	// transports holds one transport per parent edge created by createNode; do
	// waits on each of them.
	transports []Transport

	// dispatcher is shared by all transports of this execution.
	dispatcher *poolDispatcher
	// logger is assigned by Execute before do is called and is used to log
	// panics raised by sources.
	logger     *zap.Logger
}

// Execute builds the execution state for the plan p, starts it, and returns
// the plan's results keyed by name.
//
// An error is returned only when the execution state cannot be built. Errors
// that occur once the execution has been started are delivered to the
// individual results through executionState.abort.
func (e *executor) Execute(ctx context.Context, orgID platform.ID, p *plan.PlanSpec, a *Allocator) (map[string]query.Result, error) {
	state, err := e.createExecutionState(ctx, orgID, p, a)
	if err != nil {
		return nil, errors.Wrap(err, "failed to initialize execute state")
	}

	// The logger has to be attached before do launches the source goroutines,
	// because their panic handler logs through it.
	state.logger = e.logger
	state.do(ctx)

	return state.results, nil
}

// validatePlan reports whether p can be executed. The only requirement that
// is checked is that the plan's concurrency quota is non-zero.
func validatePlan(p *plan.PlanSpec) error {
	if quota := p.Resources.ConcurrencyQuota; quota != 0 {
		return nil
	}
	return errors.New("plan must have a non-zero concurrency quota")
}

// createExecutionState validates the plan p and builds the executionState
// used to run it.
//
// It sets the limit of the allocator a to the plan's memory quota, creates a
// node graph for every result declared in the plan (nodes shared between
// results are created once), and attaches a result to the dataset of each
// yield. The returned state already carries the executor's logger.
//
// An error is returned when the plan is invalid, when a is nil, when a result
// refers to a procedure that is not part of the plan, or when a node cannot
// be created.
func (e *executor) createExecutionState(ctx context.Context, orgID platform.ID, p *plan.PlanSpec, a *Allocator) (*executionState, error) {
	if err := validatePlan(p); err != nil {
		return nil, errors.Wrap(err, "invalid plan")
	}
	// The allocator is dereferenced right below; fail with an error rather
	// than a nil pointer panic.
	if a == nil {
		return nil, errors.New("allocator must not be nil")
	}
	// Set allocation limit
	a.Limit = p.Resources.MemoryBytesQuota
	es := &executionState{
		orgID:     orgID,
		p:         p,
		deps:      e.deps,
		alloc:     a,
		resources: p.Resources,
		results:   make(map[string]query.Result, len(p.Results)),
		// TODO(nathanielc): Have the planner specify the dispatcher throughput
		dispatcher: newPoolDispatcher(10, e.logger),
		// Attach the logger at construction so the state never exists
		// without one.
		logger: e.logger,
	}
	nodes := make(map[plan.ProcedureID]Node, len(p.Procedures))
	for name, yield := range p.Results {
		// A yield pointing at a procedure the plan does not contain would
		// otherwise hand a nil procedure to createNode.
		pr := p.Procedures[yield.ID]
		if pr == nil {
			return nil, fmt.Errorf("result %q references unknown procedure %v", name, yield.ID)
		}
		ds, err := es.createNode(ctx, pr, nodes)
		if err != nil {
			return nil, err
		}
		r := newResult(name, yield)
		ds.AddTransformation(r)
		es.results[name] = r
	}
	return es, nil
}

// DefaultTriggerSpec defines the triggering that should be used for datasets
// whose parent transformation is not a windowing transformation.
// createNode applies it to every dataset whose procedure spec does not
// supply its own trigger spec through a TriggerSpec method.
var DefaultTriggerSpec = query.AfterWatermarkTriggerSpec{}

// triggeringSpec is implemented by procedure specs that choose their own
// trigger spec. createNode uses the returned value instead of
// DefaultTriggerSpec when a spec implements it.
type triggeringSpec interface {
	// TriggerSpec returns the trigger spec to set on the procedure's dataset.
	TriggerSpec() query.TriggerSpec
}

// createNode returns the execution node for the procedure pr, creating it and,
// recursively, all of its parents when it does not exist yet.
//
// nodes caches the nodes created so far, keyed by procedure ID, so a procedure
// shared by several children is only built once. A procedure whose kind is
// registered in procedureToSource becomes a source and is recorded in
// es.sources. Any other procedure must have a kind registered in
// procedureToTransformation; its dataset is returned and a transport feeding
// the transformation is attached to each parent and recorded in es.transports.
//
// An error is returned when pr is nil, when a parent ID is not part of the
// plan, when the procedure kind is unsupported, or when the source or
// transformation constructor fails.
func (es *executionState) createNode(ctx context.Context, pr *plan.Procedure, nodes map[plan.ProcedureID]Node) (Node, error) {
	// A nil procedure means the caller looked up an ID the plan does not
	// contain; report it instead of panicking on pr.ID below.
	if pr == nil {
		return nil, errors.New("plan references a procedure that does not exist")
	}

	// Check if we already created this node
	if n, ok := nodes[pr.ID]; ok {
		return n, nil
	}

	// Build execution context
	ec := executionContext{
		es: es,
		streamContext: newStreamContext(Bounds{
			Start: resolveTime(pr.Bounds.Start, es.p.Now),
			Stop:  resolveTime(pr.Bounds.Stop, es.p.Now),
		}),
	}

	if len(pr.Parents) > 0 {
		ec.parents = make([]DatasetID, len(pr.Parents))
		for i, parentID := range pr.Parents {
			ec.parents[i] = DatasetID(parentID)
		}
	}

	// If source create source
	if createS, ok := procedureToSource[pr.Spec.Kind()]; ok {
		s, err := createS(pr.Spec, DatasetID(pr.ID), ec)
		if err != nil {
			return nil, err
		}
		es.sources = append(es.sources, s)
		nodes[pr.ID] = s
		return s, nil
	}

	createT, ok := procedureToTransformation[pr.Spec.Kind()]
	if !ok {
		return nil, fmt.Errorf("unsupported procedure %v", pr.Spec.Kind())
	}

	// Create the transformation
	t, ds, err := createT(DatasetID(pr.ID), AccumulatingMode, pr.Spec, ec)
	if err != nil {
		return nil, err
	}
	// Register the dataset before recursing so later lookups of this
	// procedure reuse it.
	nodes[pr.ID] = ds

	// Setup triggering. The asserted value gets its own name so it does not
	// shadow the transformation t used for the transports below.
	var ts query.TriggerSpec = DefaultTriggerSpec
	if custom, ok := pr.Spec.(triggeringSpec); ok {
		ts = custom.TriggerSpec()
	}
	ds.SetTriggerSpec(ts)

	// Recurse creating parents
	for _, parentID := range pr.Parents {
		parentPr := es.p.Procedures[parentID]
		if parentPr == nil {
			return nil, fmt.Errorf("procedure %v references unknown parent %v", pr.ID, parentID)
		}
		parent, err := es.createNode(ctx, parentPr, nodes)
		if err != nil {
			return nil, err
		}
		transport := newConescutiveTransport(es.dispatcher, t)
		es.transports = append(es.transports, transport)
		parent.AddTransformation(transport)
	}

	return ds, nil
}

// abort forwards err to every result of the execution.
//
// Each entry of es.results is asserted to be a *result; an entry of any other
// type makes the assertion panic.
func (es *executionState) abort(err error) {
	for name := range es.results {
		res := es.results[name].(*result)
		res.abort(err)
	}
}

// do starts the execution.
//
// Every source is run in its own goroutine. A panic inside a source is
// recovered, turned into an error that aborts all results, and logged at info
// level together with the stack trace. After the sources are launched the
// dispatcher is started with the plan's concurrency quota, and a further
// goroutine waits for each transport in turn. While waiting it aborts the
// results when ctx is done or when the dispatcher reports a non-nil error.
// Once every transport has been waited on, the dispatcher is stopped and any
// error it returns aborts the results as well.
func (es *executionState) do(ctx context.Context) {
	for _, src := range es.sources {
		go func(src Source) {
			// Setup panic handling on the source goroutines
			defer func() {
				e := recover()
				if e == nil {
					return
				}
				// We had a panic, abort the entire execution.
				err, ok := e.(error)
				if !ok {
					err = fmt.Errorf("%v", e)
				}
				// Capture the stack once and reuse it for both the abort
				// error and the log entry.
				stack := debug.Stack()
				es.abort(fmt.Errorf("panic: %v\n%s", err, stack))
				if entry := es.logger.Check(zapcore.InfoLevel, "Execute source panic"); entry != nil {
					entry.Stack = string(stack)
					entry.Write(zap.Error(err))
				}
			}()
			src.Run(ctx)
		}(src)
	}
	es.dispatcher.Start(es.resources.ConcurrencyQuota, ctx)
	go func() {
		// Wait for all transports to finish
		for _, t := range es.transports {
			select {
			case <-t.Finished():
			case <-ctx.Done():
				es.abort(errors.New("context done"))
			case err := <-es.dispatcher.Err():
				if err != nil {
					es.abort(err)
				}
			}
		}
		// Check for any errors on the dispatcher
		err := es.dispatcher.Stop()
		if err != nil {
			es.abort(err)
		}
	}()
}

// executionContext is the per-node view of an execution that createNode hands
// to source and transformation constructors.
// Need a unique stream context per execution context
type executionContext struct {
	// es is the execution state shared by all nodes of the plan.
	es            *executionState
	// parents holds the dataset IDs of the node's parents; it is left nil for
	// a procedure without parents.
	parents       []DatasetID
	// streamContext carries the bounds resolved for this node's procedure.
	streamContext streamContext
}

// OrganizationID returns the ID of the organization the plan is executed for.
// It is part of satisfying the ExecutionContext interface.
func (ec executionContext) OrganizationID() platform.ID {
	state := ec.es
	return state.orgID
}

// resolveTime converts the query time qt into an execution Time. qt is first
// resolved through qt.Time with now as its argument, and the UnixNano value
// of the result becomes the returned Time.
func resolveTime(qt query.Time, now time.Time) Time {
	resolved := qt.Time(now)
	return Time(resolved.UnixNano())
}

// ResolveTime converts qt into an execution Time using the plan's Now value
// as the reference time.
func (ec executionContext) ResolveTime(qt query.Time) Time {
	now := ec.es.p.Now
	return resolveTime(qt, now)
}

// StreamContext returns the stream context created for this node.
func (ec executionContext) StreamContext() StreamContext {
	var sc StreamContext = ec.streamContext
	return sc
}

// Allocator returns the allocator shared by all nodes of the execution.
func (ec executionContext) Allocator() *Allocator {
	state := ec.es
	return state.alloc
}

// Parents returns the dataset IDs of this node's parents. The slice is nil
// when the node has no parents.
func (ec executionContext) Parents() []DatasetID {
	ids := ec.parents
	return ids
}
// ConvertID converts a plan procedure ID into the corresponding dataset ID
// with a plain type conversion.
func (ec executionContext) ConvertID(id plan.ProcedureID) DatasetID {
	dsID := DatasetID(id)
	return dsID
}

// Dependencies returns the dependencies the executor was created with.
func (ec executionContext) Dependencies() Dependencies {
	state := ec.es
	return state.deps
}
docs(query): add package docs for the packages in the query package 2018-08-13 20:15:44 +00:00			`// Package execute contains the implementation of the execution phase in the query engine.`
initial copy of ifql repo 2018-05-21 21:13:54 +00:00			`package execute`

			`import (`
			`"context"`
			`"fmt"`
			`"runtime/debug"`
Add Stream Context to Executor (#609) Add stream context with bounds to planner/execution engine 2018-08-14 23:18:59 +00:00			`"time"`
initial copy of ifql repo 2018-05-21 21:13:54 +00:00
chore(query): remove usage of query/id package It was effectively a copied and pasted platform.ID, so change it to a type alias. Once our known references to the query/id package are updated to platform.ID, we'll delete the package. 2018-06-15 22:47:40 +00:00			`"github.com/influxdata/platform"`
rewrite imports 2018-05-21 21:20:06 +00:00			`"github.com/influxdata/platform/query"`
			`"github.com/influxdata/platform/query/plan"`
initial copy of ifql repo 2018-05-21 21:13:54 +00:00			`"github.com/pkg/errors"`
feat(query): log panics with their stacktraces within the query executor The logger is now threaded into the query controller, executor, and the dispatcher so that we can log panics. They are logged at the info level because the panics do not result in the system crashing and becoming unusable. 2018-08-15 20:13:23 +00:00			`"go.uber.org/zap"`
			`"go.uber.org/zap/zapcore"`
initial copy of ifql repo 2018-05-21 21:13:54 +00:00			`)`

			`type Executor interface {`
feat: Add query statistics Introduces the Statisticser interface which ResultIterators may implement. The HTTP implementation uses HTTP trailers to preserve the statistics. This way we do not need to have all encoders and decoders support statistics. 2018-07-13 18:56:09 +00:00			`Execute(ctx context.Context, orgID platform.ID, p plan.PlanSpec, a Allocator) (map[string]query.Result, error)`
initial copy of ifql repo 2018-05-21 21:13:54 +00:00			`}`

			`type executor struct {`
feat(query): log panics with their stacktraces within the query executor The logger is now threaded into the query controller, executor, and the dispatcher so that we can log panics. They are logged at the info level because the panics do not result in the system crashing and becoming unusable. 2018-08-15 20:13:23 +00:00			`deps Dependencies`
			`logger *zap.Logger`
initial copy of ifql repo 2018-05-21 21:13:54 +00:00			`}`

feat(query): log panics with their stacktraces within the query executor The logger is now threaded into the query controller, executor, and the dispatcher so that we can log panics. They are logged at the info level because the panics do not result in the system crashing and becoming unusable. 2018-08-15 20:13:23 +00:00			`func NewExecutor(deps Dependencies, logger *zap.Logger) Executor {`
			`if logger == nil {`
			`logger = zap.NewNop()`
			`}`
initial copy of ifql repo 2018-05-21 21:13:54 +00:00			`e := &executor{`
feat(query): log panics with their stacktraces within the query executor The logger is now threaded into the query controller, executor, and the dispatcher so that we can log panics. They are logged at the info level because the panics do not result in the system crashing and becoming unusable. 2018-08-15 20:13:23 +00:00			`deps: deps,`
			`logger: logger,`
initial copy of ifql repo 2018-05-21 21:13:54 +00:00			`}`
			`return e`
			`}`

Add Stream Context to Executor (#609) Add stream context with bounds to planner/execution engine 2018-08-14 23:18:59 +00:00			`type streamContext struct {`
			`bounds Bounds`
			`}`

			`func newStreamContext(b Bounds) streamContext {`
			`return streamContext{`
			`bounds: b,`
			`}`
			`}`

			`func (ctx streamContext) Bounds() Bounds {`
			`return ctx.bounds`
			`}`

initial copy of ifql repo 2018-05-21 21:13:54 +00:00			`type executionState struct {`
			`p *plan.PlanSpec`
			`deps Dependencies`

chore(query): remove usage of query/id package It was effectively a copied and pasted platform.ID, so change it to a type alias. Once our known references to the query/id package are updated to platform.ID, we'll delete the package. 2018-06-15 22:47:40 +00:00			`orgID platform.ID`
initial copy of ifql repo 2018-05-21 21:13:54 +00:00
			`alloc *Allocator`

			`resources query.ResourceManagement`

move types around to avoid cyclic imports 2018-05-21 23:02:42 +00:00			`results map[string]query.Result`
initial copy of ifql repo 2018-05-21 21:13:54 +00:00			`sources []Source`

			`transports []Transport`

			`dispatcher *poolDispatcher`
feat(query): log panics with their stacktraces within the query executor The logger is now threaded into the query controller, executor, and the dispatcher so that we can log panics. They are logged at the info level because the panics do not result in the system crashing and becoming unusable. 2018-08-15 20:13:23 +00:00			`logger *zap.Logger`
initial copy of ifql repo 2018-05-21 21:13:54 +00:00			`}`

feat: Add query statistics Introduces the Statisticser interface which ResultIterators may implement. The HTTP implementation uses HTTP trailers to preserve the statistics. This way we do not need to have all encoders and decoders support statistics. 2018-07-13 18:56:09 +00:00			`func (e executor) Execute(ctx context.Context, orgID platform.ID, p plan.PlanSpec, a *Allocator) (map[string]query.Result, error) {`
			`es, err := e.createExecutionState(ctx, orgID, p, a)`
initial copy of ifql repo 2018-05-21 21:13:54 +00:00			`if err != nil {`
			`return nil, errors.Wrap(err, "failed to initialize execute state")`
			`}`
feat(query): log panics with their stacktraces within the query executor The logger is now threaded into the query controller, executor, and the dispatcher so that we can log panics. They are logged at the info level because the panics do not result in the system crashing and becoming unusable. 2018-08-15 20:13:23 +00:00			`es.logger = e.logger`
initial copy of ifql repo 2018-05-21 21:13:54 +00:00			`es.do(ctx)`
			`return es.results, nil`
			`}`

			`func validatePlan(p *plan.PlanSpec) error {`
			`if p.Resources.ConcurrencyQuota == 0 {`
			`return errors.New("plan must have a non-zero concurrency quota")`
			`}`
			`return nil`
			`}`

feat: Add query statistics Introduces the Statisticser interface which ResultIterators may implement. The HTTP implementation uses HTTP trailers to preserve the statistics. This way we do not need to have all encoders and decoders support statistics. 2018-07-13 18:56:09 +00:00			`func (e executor) createExecutionState(ctx context.Context, orgID platform.ID, p plan.PlanSpec, a Allocator) (executionState, error) {`
initial copy of ifql repo 2018-05-21 21:13:54 +00:00			`if err := validatePlan(p); err != nil {`
			`return nil, errors.Wrap(err, "invalid plan")`
			`}`
feat: Add query statistics Introduces the Statisticser interface which ResultIterators may implement. The HTTP implementation uses HTTP trailers to preserve the statistics. This way we do not need to have all encoders and decoders support statistics. 2018-07-13 18:56:09 +00:00			`// Set allocation limit`
			`a.Limit = p.Resources.MemoryBytesQuota`
initial copy of ifql repo 2018-05-21 21:13:54 +00:00			`es := &executionState{`
feat: Add query statistics Introduces the Statisticser interface which ResultIterators may implement. The HTTP implementation uses HTTP trailers to preserve the statistics. This way we do not need to have all encoders and decoders support statistics. 2018-07-13 18:56:09 +00:00			`orgID: orgID,`
			`p: p,`
			`deps: e.deps,`
			`alloc: a,`
initial copy of ifql repo 2018-05-21 21:13:54 +00:00			`resources: p.Resources,`
move types around to avoid cyclic imports 2018-05-21 23:02:42 +00:00			`results: make(map[string]query.Result, len(p.Results)),`
initial copy of ifql repo 2018-05-21 21:13:54 +00:00			`// TODO(nathanielc): Have the planner specify the dispatcher throughput`
feat(query): log panics with their stacktraces within the query executor The logger is now threaded into the query controller, executor, and the dispatcher so that we can log panics. They are logged at the info level because the panics do not result in the system crashing and becoming unusable. 2018-08-15 20:13:23 +00:00			`dispatcher: newPoolDispatcher(10, e.logger),`
initial copy of ifql repo 2018-05-21 21:13:54 +00:00			`}`
			`nodes := make(map[plan.ProcedureID]Node, len(p.Procedures))`
			`for name, yield := range p.Results {`
			`ds, err := es.createNode(ctx, p.Procedures[yield.ID], nodes)`
			`if err != nil {`
			`return nil, err`
			`}`
fix(query/csv): Encode result iterator errors This change also adds Name() to the Result interface to allow for correct MultiResultEncoding. 2018-05-24 17:29:36 +00:00			`r := newResult(name, yield)`
initial copy of ifql repo 2018-05-21 21:13:54 +00:00			`ds.AddTransformation(r)`
			`es.results[name] = r`
			`}`
			`return es, nil`
			`}`

			`// DefaultTriggerSpec defines the triggering that should be used for datasets`
			`// whose parent transformation is not a windowing transformation.`
			`var DefaultTriggerSpec = query.AfterWatermarkTriggerSpec{}`

			`type triggeringSpec interface {`
			`TriggerSpec() query.TriggerSpec`
			`}`

			`func (es executionState) createNode(ctx context.Context, pr plan.Procedure, nodes map[plan.ProcedureID]Node) (Node, error) {`
			`// Check if we already created this node`
			`if n, ok := nodes[pr.ID]; ok {`
			`return n, nil`
			`}`
Add Stream Context to Executor (#609) Add stream context with bounds to planner/execution engine 2018-08-14 23:18:59 +00:00
initial copy of ifql repo 2018-05-21 21:13:54 +00:00			`// Build execution context`
			`ec := executionContext{`
			`es: es,`
Add Stream Context to Executor (#609) Add stream context with bounds to planner/execution engine 2018-08-14 23:18:59 +00:00			`streamContext: newStreamContext(Bounds{`
			`Start: resolveTime(pr.Bounds.Start, es.p.Now),`
			`Stop: resolveTime(pr.Bounds.Stop, es.p.Now),`
			`}),`
initial copy of ifql repo 2018-05-21 21:13:54 +00:00			`}`
Add Stream Context to Executor (#609) Add stream context with bounds to planner/execution engine 2018-08-14 23:18:59 +00:00
initial copy of ifql repo 2018-05-21 21:13:54 +00:00			`if len(pr.Parents) > 0 {`
			`ec.parents = make([]DatasetID, len(pr.Parents))`
			`for i, parentID := range pr.Parents {`
			`ec.parents[i] = DatasetID(parentID)`
			`}`
			`}`

			`// If source create source`
			`if createS, ok := procedureToSource[pr.Spec.Kind()]; ok {`
			`s, err := createS(pr.Spec, DatasetID(pr.ID), ec)`
			`if err != nil {`
			`return nil, err`
			`}`
			`es.sources = append(es.sources, s)`
			`nodes[pr.ID] = s`
			`return s, nil`
			`}`

			`createT, ok := procedureToTransformation[pr.Spec.Kind()]`
			`if !ok {`
			`return nil, fmt.Errorf("unsupported procedure %v", pr.Spec.Kind())`
			`}`

			`// Create the transformation`
			`t, ds, err := createT(DatasetID(pr.ID), AccumulatingMode, pr.Spec, ec)`
			`if err != nil {`
			`return nil, err`
			`}`
			`nodes[pr.ID] = ds`

			`// Setup triggering`
			`var ts query.TriggerSpec = DefaultTriggerSpec`
			`if t, ok := pr.Spec.(triggeringSpec); ok {`
			`ts = t.TriggerSpec()`
			`}`
			`ds.SetTriggerSpec(ts)`

			`// Recurse creating parents`
			`for _, parentID := range pr.Parents {`
			`parent, err := es.createNode(ctx, es.p.Procedures[parentID], nodes)`
			`if err != nil {`
			`return nil, err`
			`}`
			`transport := newConescutiveTransport(es.dispatcher, t)`
			`es.transports = append(es.transports, transport)`
			`parent.AddTransformation(transport)`
			`}`

			`return ds, nil`
			`}`

			`func (es *executionState) abort(err error) {`
			`for _, r := range es.results {`
			`r.(*result).abort(err)`
			`}`
			`}`

			`func (es *executionState) do(ctx context.Context) {`
			`for _, src := range es.sources {`
			`go func(src Source) {`
			`// Setup panic handling on the source goroutines`
			`defer func() {`
			`if e := recover(); e != nil {`
			`// We had a panic, abort the entire execution.`
			`var err error`
			`switch e := e.(type) {`
			`case error:`
			`err = e`
			`default:`
			`err = fmt.Errorf("%v", e)`
			`}`
			`es.abort(fmt.Errorf("panic: %v\n%s", err, debug.Stack()))`
feat(query): log panics with their stacktraces within the query executor The logger is now threaded into the query controller, executor, and the dispatcher so that we can log panics. They are logged at the info level because the panics do not result in the system crashing and becoming unusable. 2018-08-15 20:13:23 +00:00			`if entry := es.logger.Check(zapcore.InfoLevel, "Execute source panic"); entry != nil {`
			`entry.Stack = string(debug.Stack())`
			`entry.Write(zap.Error(err))`
			`}`
initial copy of ifql repo 2018-05-21 21:13:54 +00:00			`}`
			`}()`
			`src.Run(ctx)`
			`}(src)`
			`}`
			`es.dispatcher.Start(es.resources.ConcurrencyQuota, ctx)`
			`go func() {`
			`// Wait for all transports to finish`
			`for _, t := range es.transports {`
			`select {`
			`case <-t.Finished():`
			`case <-ctx.Done():`
			`es.abort(errors.New("context done"))`
			`case err := <-es.dispatcher.Err():`
			`if err != nil {`
			`es.abort(err)`
			`}`
			`}`
			`}`
			`// Check for any errors on the dispatcher`
			`err := es.dispatcher.Stop()`
			`if err != nil {`
			`es.abort(err)`
			`}`
			`}()`
			`}`

Add Stream Context to Executor (#609) Add stream context with bounds to planner/execution engine 2018-08-14 23:18:59 +00:00			`// Need a unique stream context per execution context`
initial copy of ifql repo 2018-05-21 21:13:54 +00:00			`type executionContext struct {`
Add Stream Context to Executor (#609) Add stream context with bounds to planner/execution engine 2018-08-14 23:18:59 +00:00			`es *executionState`
			`parents []DatasetID`
			`streamContext streamContext`
initial copy of ifql repo 2018-05-21 21:13:54 +00:00			`}`

			`// Satisfy the ExecutionContext interface`
chore(query): remove usage of query/id package It was effectively a copied and pasted platform.ID, so change it to a type alias. Once our known references to the query/id package are updated to platform.ID, we'll delete the package. 2018-06-15 22:47:40 +00:00			`func (ec executionContext) OrganizationID() platform.ID {`
initial copy of ifql repo 2018-05-21 21:13:54 +00:00			`return ec.es.orgID`
			`}`

Add Stream Context to Executor (#609) Add stream context with bounds to planner/execution engine 2018-08-14 23:18:59 +00:00			`func resolveTime(qt query.Time, now time.Time) Time {`
			`return Time(qt.Time(now).UnixNano())`
			`}`

initial copy of ifql repo 2018-05-21 21:13:54 +00:00			`func (ec executionContext) ResolveTime(qt query.Time) Time {`
Add Stream Context to Executor (#609) Add stream context with bounds to planner/execution engine 2018-08-14 23:18:59 +00:00			`return resolveTime(qt, ec.es.p.Now)`
initial copy of ifql repo 2018-05-21 21:13:54 +00:00			`}`
Add Stream Context to Executor (#609) Add stream context with bounds to planner/execution engine 2018-08-14 23:18:59 +00:00
			`func (ec executionContext) StreamContext() StreamContext {`
			`return ec.streamContext`
initial copy of ifql repo 2018-05-21 21:13:54 +00:00			`}`

			`func (ec executionContext) Allocator() *Allocator {`
			`return ec.es.alloc`
			`}`

			`func (ec executionContext) Parents() []DatasetID {`
			`return ec.parents`
			`}`
			`func (ec executionContext) ConvertID(id plan.ProcedureID) DatasetID {`
			`return DatasetID(id)`
			`}`

			`func (ec executionContext) Dependencies() Dependencies {`
			`return ec.es.deps`
			`}`