2021-12-01 14:28:08 +00:00
|
|
|
// Licensed to the LF AI & Data foundation under one
|
|
|
|
// or more contributor license agreements. See the NOTICE file
|
|
|
|
// distributed with this work for additional information
|
|
|
|
// regarding copyright ownership. The ASF licenses this file
|
|
|
|
// to you under the Apache License, Version 2.0 (the
|
|
|
|
// "License"); you may not use this file except in compliance
|
2021-06-09 03:37:55 +00:00
|
|
|
// with the License. You may obtain a copy of the License at
|
|
|
|
//
|
2021-12-01 14:28:08 +00:00
|
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
2021-06-09 03:37:55 +00:00
|
|
|
//
|
2021-12-01 14:28:08 +00:00
|
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
// See the License for the specific language governing permissions and
|
|
|
|
// limitations under the License.
|
2021-06-09 03:37:55 +00:00
|
|
|
|
|
|
|
package querynode
|
|
|
|
|
|
|
|
import (
|
|
|
|
"context"
|
|
|
|
"errors"
|
2022-03-02 06:49:55 +00:00
|
|
|
"fmt"
|
2022-10-19 05:21:31 +00:00
|
|
|
"time"
|
2021-06-09 03:37:55 +00:00
|
|
|
|
2022-11-07 02:15:02 +00:00
|
|
|
"github.com/milvus-io/milvus/internal/util/typeutil"
|
|
|
|
|
2021-06-09 03:37:55 +00:00
|
|
|
"go.uber.org/zap"
|
|
|
|
|
|
|
|
"github.com/milvus-io/milvus/internal/log"
|
2022-03-02 06:49:55 +00:00
|
|
|
"github.com/milvus-io/milvus/internal/metrics"
|
2022-03-03 13:57:56 +00:00
|
|
|
"github.com/milvus-io/milvus/internal/mq/msgstream"
|
|
|
|
"github.com/milvus-io/milvus/internal/mq/msgstream/mqwrapper"
|
2021-06-09 03:37:55 +00:00
|
|
|
"github.com/milvus-io/milvus/internal/proto/internalpb"
|
|
|
|
"github.com/milvus-io/milvus/internal/util/flowgraph"
|
2022-11-04 06:25:38 +00:00
|
|
|
"github.com/milvus-io/milvus/internal/util/paramtable"
|
2022-10-19 05:21:31 +00:00
|
|
|
"github.com/milvus-io/milvus/internal/util/tsoutil"
|
2021-06-09 03:37:55 +00:00
|
|
|
)
|
|
|
|
|
2022-11-03 07:03:35 +00:00
|
|
|
type (
|
|
|
|
// baseNode is type flowgraph.BaseNode
|
|
|
|
baseNode = flowgraph.BaseNode
|
|
|
|
|
|
|
|
// node is type flowgraph.Node
|
|
|
|
node = flowgraph.Node
|
|
|
|
)
|
|
|
|
|
2021-09-27 11:06:07 +00:00
|
|
|
// queryNodeFlowGraph is a TimeTickedFlowGraph in query node
|
2021-06-09 03:37:55 +00:00
|
|
|
type queryNodeFlowGraph struct {
|
|
|
|
ctx context.Context
|
|
|
|
cancel context.CancelFunc
|
|
|
|
collectionID UniqueID
|
2022-11-03 07:03:35 +00:00
|
|
|
vchannel Channel
|
2021-06-09 03:37:55 +00:00
|
|
|
flowGraph *flowgraph.TimeTickedFlowGraph
|
|
|
|
dmlStream msgstream.MsgStream
|
2022-03-15 13:51:21 +00:00
|
|
|
consumerCnt int
|
2021-06-09 03:37:55 +00:00
|
|
|
}
|
|
|
|
|
2021-12-21 13:12:04 +00:00
|
|
|
// newQueryNodeFlowGraph returns a new queryNodeFlowGraph
|
2021-06-09 03:37:55 +00:00
|
|
|
func newQueryNodeFlowGraph(ctx context.Context,
|
|
|
|
collectionID UniqueID,
|
2022-05-31 05:42:03 +00:00
|
|
|
metaReplica ReplicaInterface,
|
2021-06-09 03:37:55 +00:00
|
|
|
tSafeReplica TSafeReplicaInterface,
|
2022-11-03 07:03:35 +00:00
|
|
|
vchannel Channel,
|
2022-03-09 07:17:59 +00:00
|
|
|
factory msgstream.Factory) (*queryNodeFlowGraph, error) {
|
2021-06-09 03:37:55 +00:00
|
|
|
|
|
|
|
ctx1, cancel := context.WithCancel(ctx)
|
|
|
|
|
|
|
|
q := &queryNodeFlowGraph{
|
|
|
|
ctx: ctx1,
|
|
|
|
cancel: cancel,
|
|
|
|
collectionID: collectionID,
|
2022-11-03 07:03:35 +00:00
|
|
|
vchannel: vchannel,
|
2021-06-09 03:37:55 +00:00
|
|
|
flowGraph: flowgraph.NewTimeTickedFlowGraph(ctx1),
|
|
|
|
}
|
|
|
|
|
2022-11-07 02:15:02 +00:00
|
|
|
dmStreamNode, err := q.newDmInputNode(ctx1, factory, collectionID, vchannel, metrics.InsertLabel)
|
2022-03-09 07:17:59 +00:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
2022-11-03 07:03:35 +00:00
|
|
|
var filterDmNode node = newFilteredDmNode(metaReplica, collectionID, vchannel)
|
|
|
|
var insertNode node = newInsertNode(metaReplica, collectionID, vchannel)
|
|
|
|
var serviceTimeNode node = newServiceTimeNode(tSafeReplica, collectionID, vchannel)
|
2021-06-09 03:37:55 +00:00
|
|
|
|
|
|
|
q.flowGraph.AddNode(dmStreamNode)
|
|
|
|
q.flowGraph.AddNode(filterDmNode)
|
|
|
|
q.flowGraph.AddNode(insertNode)
|
|
|
|
q.flowGraph.AddNode(serviceTimeNode)
|
|
|
|
|
|
|
|
// dmStreamNode
|
2022-03-09 07:17:59 +00:00
|
|
|
err = q.flowGraph.SetEdges(dmStreamNode.Name(),
|
2021-06-09 03:37:55 +00:00
|
|
|
[]string{filterDmNode.Name()},
|
|
|
|
)
|
|
|
|
if err != nil {
|
2022-03-09 07:17:59 +00:00
|
|
|
return nil, fmt.Errorf("set edges failed in node: %s, err = %s", dmStreamNode.Name(), err.Error())
|
2021-06-09 03:37:55 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// filterDmNode
|
|
|
|
err = q.flowGraph.SetEdges(filterDmNode.Name(),
|
|
|
|
[]string{insertNode.Name()},
|
|
|
|
)
|
|
|
|
if err != nil {
|
2022-03-09 07:17:59 +00:00
|
|
|
return nil, fmt.Errorf("set edges failed in node: %s, err = %s", filterDmNode.Name(), err.Error())
|
2021-06-09 03:37:55 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// insertNode
|
|
|
|
err = q.flowGraph.SetEdges(insertNode.Name(),
|
|
|
|
[]string{serviceTimeNode.Name()},
|
|
|
|
)
|
|
|
|
if err != nil {
|
2022-03-09 07:17:59 +00:00
|
|
|
return nil, fmt.Errorf("set edges failed in node: %s, err = %s", insertNode.Name(), err.Error())
|
2021-06-09 03:37:55 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// serviceTimeNode
|
|
|
|
err = q.flowGraph.SetEdges(serviceTimeNode.Name(),
|
|
|
|
[]string{},
|
|
|
|
)
|
|
|
|
if err != nil {
|
2022-03-09 07:17:59 +00:00
|
|
|
return nil, fmt.Errorf("set edges failed in node: %s, err = %s", serviceTimeNode.Name(), err.Error())
|
2021-06-09 03:37:55 +00:00
|
|
|
}
|
|
|
|
|
2022-03-09 07:17:59 +00:00
|
|
|
return q, nil
|
2021-06-09 03:37:55 +00:00
|
|
|
}
|
|
|
|
|
2021-12-21 13:13:55 +00:00
|
|
|
// newQueryNodeDeltaFlowGraph returns a new queryNodeFlowGraph
|
2021-11-06 03:02:58 +00:00
|
|
|
func newQueryNodeDeltaFlowGraph(ctx context.Context,
|
|
|
|
collectionID UniqueID,
|
2022-05-31 05:42:03 +00:00
|
|
|
metaReplica ReplicaInterface,
|
2021-11-06 03:02:58 +00:00
|
|
|
tSafeReplica TSafeReplicaInterface,
|
2022-11-03 07:03:35 +00:00
|
|
|
vchannel Channel,
|
2022-03-09 07:17:59 +00:00
|
|
|
factory msgstream.Factory) (*queryNodeFlowGraph, error) {
|
2021-11-06 03:02:58 +00:00
|
|
|
|
|
|
|
ctx1, cancel := context.WithCancel(ctx)
|
|
|
|
|
|
|
|
q := &queryNodeFlowGraph{
|
|
|
|
ctx: ctx1,
|
|
|
|
cancel: cancel,
|
|
|
|
collectionID: collectionID,
|
2022-11-03 07:03:35 +00:00
|
|
|
vchannel: vchannel,
|
2021-11-06 03:02:58 +00:00
|
|
|
flowGraph: flowgraph.NewTimeTickedFlowGraph(ctx1),
|
|
|
|
}
|
|
|
|
|
2022-11-07 02:15:02 +00:00
|
|
|
dmStreamNode, err := q.newDmInputNode(ctx1, factory, collectionID, vchannel, metrics.DeleteLabel)
|
2022-03-09 07:17:59 +00:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
2022-11-03 07:03:35 +00:00
|
|
|
var filterDeleteNode node = newFilteredDeleteNode(metaReplica, collectionID, vchannel)
|
|
|
|
var deleteNode node = newDeleteNode(metaReplica, collectionID, vchannel)
|
|
|
|
var serviceTimeNode node = newServiceTimeNode(tSafeReplica, collectionID, vchannel)
|
2021-11-06 03:02:58 +00:00
|
|
|
|
|
|
|
q.flowGraph.AddNode(dmStreamNode)
|
|
|
|
q.flowGraph.AddNode(filterDeleteNode)
|
|
|
|
q.flowGraph.AddNode(deleteNode)
|
|
|
|
q.flowGraph.AddNode(serviceTimeNode)
|
|
|
|
|
|
|
|
// dmStreamNode
|
2022-03-09 07:17:59 +00:00
|
|
|
err = q.flowGraph.SetEdges(dmStreamNode.Name(),
|
2021-11-06 03:02:58 +00:00
|
|
|
[]string{filterDeleteNode.Name()},
|
|
|
|
)
|
|
|
|
if err != nil {
|
2022-03-09 07:17:59 +00:00
|
|
|
return nil, fmt.Errorf("set edges failed in node: %s, err = %s", dmStreamNode.Name(), err.Error())
|
2021-11-06 03:02:58 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// filterDmNode
|
|
|
|
err = q.flowGraph.SetEdges(filterDeleteNode.Name(),
|
|
|
|
[]string{deleteNode.Name()},
|
|
|
|
)
|
|
|
|
if err != nil {
|
2022-03-09 07:17:59 +00:00
|
|
|
return nil, fmt.Errorf("set edges failed in node: %s, err = %s", filterDeleteNode.Name(), err.Error())
|
2021-11-06 03:02:58 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// insertNode
|
|
|
|
err = q.flowGraph.SetEdges(deleteNode.Name(),
|
|
|
|
[]string{serviceTimeNode.Name()},
|
|
|
|
)
|
|
|
|
if err != nil {
|
2022-03-09 07:17:59 +00:00
|
|
|
return nil, fmt.Errorf("set edges failed in node: %s, err = %s", deleteNode.Name(), err.Error())
|
2021-11-06 03:02:58 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// serviceTimeNode
|
|
|
|
err = q.flowGraph.SetEdges(serviceTimeNode.Name(),
|
|
|
|
[]string{},
|
|
|
|
)
|
|
|
|
if err != nil {
|
2022-03-09 07:17:59 +00:00
|
|
|
return nil, fmt.Errorf("set edges failed in node: %s, err = %s", serviceTimeNode.Name(), err.Error())
|
2021-11-06 03:02:58 +00:00
|
|
|
}
|
|
|
|
|
2022-03-09 07:17:59 +00:00
|
|
|
return q, nil
|
2021-11-06 03:02:58 +00:00
|
|
|
}
|
|
|
|
|
2021-12-21 13:15:49 +00:00
|
|
|
// newDmInputNode returns a new inputNode
|
2022-11-07 02:15:02 +00:00
|
|
|
|
|
|
|
func (q *queryNodeFlowGraph) newDmInputNode(ctx context.Context, factory msgstream.Factory, collectionID UniqueID, vchannel Channel, dataType string) (*flowgraph.InputNode, error) {
|
2021-06-09 03:37:55 +00:00
|
|
|
insertStream, err := factory.NewTtMsgStream(ctx)
|
|
|
|
if err != nil {
|
2022-03-09 07:17:59 +00:00
|
|
|
return nil, err
|
2021-06-09 03:37:55 +00:00
|
|
|
}
|
|
|
|
|
2022-03-09 07:17:59 +00:00
|
|
|
q.dmlStream = insertStream
|
|
|
|
|
2021-12-23 10:39:11 +00:00
|
|
|
maxQueueLength := Params.QueryNodeCfg.FlowGraphMaxQueueLength
|
|
|
|
maxParallelism := Params.QueryNodeCfg.FlowGraphMaxParallelism
|
2022-11-03 07:03:35 +00:00
|
|
|
name := fmt.Sprintf("dmInputNode-query-%d-%s", collectionID, vchannel)
|
2022-11-07 02:15:02 +00:00
|
|
|
node := flowgraph.NewInputNode(insertStream, name, maxQueueLength, maxParallelism, typeutil.QueryNodeRole,
|
|
|
|
paramtable.GetNodeID(), collectionID, dataType)
|
2022-03-09 07:17:59 +00:00
|
|
|
return node, nil
|
2021-06-09 03:37:55 +00:00
|
|
|
}
|
|
|
|
|
2022-03-09 07:17:59 +00:00
|
|
|
// consumeFlowGraph would consume by channel and subName
|
|
|
|
func (q *queryNodeFlowGraph) consumeFlowGraph(channel Channel, subName ConsumeSubName) error {
|
2021-06-09 03:37:55 +00:00
|
|
|
if q.dmlStream == nil {
|
|
|
|
return errors.New("null dml message stream in flow graph")
|
|
|
|
}
|
2022-10-25 05:23:30 +00:00
|
|
|
q.dmlStream.AsConsumer([]string{channel}, subName, mqwrapper.SubscriptionPositionUnknown)
|
2022-11-03 07:03:35 +00:00
|
|
|
log.Info("query node flow graph consumes from PositionUnknown",
|
|
|
|
zap.Int64("collectionID", q.collectionID),
|
|
|
|
zap.String("pchannel", channel),
|
|
|
|
zap.String("vchannel", q.vchannel),
|
|
|
|
zap.String("subName", subName),
|
2021-06-15 12:06:10 +00:00
|
|
|
)
|
2022-03-15 13:51:21 +00:00
|
|
|
q.consumerCnt++
|
2022-11-04 06:25:38 +00:00
|
|
|
metrics.QueryNodeNumConsumers.WithLabelValues(fmt.Sprint(paramtable.GetNodeID())).Inc()
|
2021-06-09 03:37:55 +00:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2022-03-09 07:17:59 +00:00
|
|
|
// consumeFlowGraphFromLatest would consume from latest by channel and subName
|
|
|
|
func (q *queryNodeFlowGraph) consumeFlowGraphFromLatest(channel Channel, subName ConsumeSubName) error {
|
2021-11-20 23:33:14 +00:00
|
|
|
if q.dmlStream == nil {
|
|
|
|
return errors.New("null dml message stream in flow graph")
|
|
|
|
}
|
2022-10-25 05:23:30 +00:00
|
|
|
q.dmlStream.AsConsumer([]string{channel}, subName, mqwrapper.SubscriptionPositionLatest)
|
2022-11-03 07:03:35 +00:00
|
|
|
log.Info("query node flow graph consumes from latest",
|
|
|
|
zap.Int64("collectionID", q.collectionID),
|
|
|
|
zap.String("pchannel", channel),
|
|
|
|
zap.String("vchannel", q.vchannel),
|
|
|
|
zap.String("subName", subName),
|
2021-11-20 23:33:14 +00:00
|
|
|
)
|
2022-03-15 13:51:21 +00:00
|
|
|
q.consumerCnt++
|
2022-11-04 06:25:38 +00:00
|
|
|
metrics.QueryNodeNumConsumers.WithLabelValues(fmt.Sprint(paramtable.GetNodeID())).Inc()
|
2021-11-20 23:33:14 +00:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2021-12-22 12:25:46 +00:00
|
|
|
// seekQueryNodeFlowGraph would seek by position
|
2022-10-25 05:23:30 +00:00
|
|
|
func (q *queryNodeFlowGraph) consumeFlowGraphFromPosition(position *internalpb.MsgPosition) error {
|
|
|
|
q.dmlStream.AsConsumer([]string{position.ChannelName}, position.MsgGroup, mqwrapper.SubscriptionPositionUnknown)
|
2022-11-03 07:03:35 +00:00
|
|
|
|
|
|
|
start := time.Now()
|
2021-06-09 03:37:55 +00:00
|
|
|
err := q.dmlStream.Seek([]*internalpb.MsgPosition{position})
|
2022-10-19 05:21:31 +00:00
|
|
|
|
|
|
|
ts, _ := tsoutil.ParseTS(position.GetTimestamp())
|
2022-11-03 07:03:35 +00:00
|
|
|
log.Info("query node flow graph seeks from position",
|
2022-10-19 05:21:31 +00:00
|
|
|
zap.Int64("collectionID", q.collectionID),
|
2022-11-03 07:03:35 +00:00
|
|
|
zap.String("pchannel", position.ChannelName),
|
|
|
|
zap.String("vchannel", q.vchannel),
|
2022-10-19 05:21:31 +00:00
|
|
|
zap.Time("checkpointTs", ts),
|
|
|
|
zap.Duration("tsLag", time.Since(ts)),
|
2022-11-03 07:03:35 +00:00
|
|
|
zap.Duration("elapse", time.Since(start)),
|
2021-06-15 12:06:10 +00:00
|
|
|
)
|
2022-03-15 13:51:21 +00:00
|
|
|
q.consumerCnt++
|
2022-11-04 06:25:38 +00:00
|
|
|
metrics.QueryNodeNumConsumers.WithLabelValues(fmt.Sprint(paramtable.GetNodeID())).Inc()
|
2021-06-09 03:37:55 +00:00
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2021-12-23 13:50:15 +00:00
|
|
|
// close would close queryNodeFlowGraph
|
2021-06-09 03:37:55 +00:00
|
|
|
func (q *queryNodeFlowGraph) close() {
|
|
|
|
q.cancel()
|
|
|
|
q.flowGraph.Close()
|
2022-03-15 13:51:21 +00:00
|
|
|
if q.dmlStream != nil && q.consumerCnt > 0 {
|
2022-11-04 06:25:38 +00:00
|
|
|
metrics.QueryNodeNumConsumers.WithLabelValues(fmt.Sprint(paramtable.GetNodeID())).Sub(float64(q.consumerCnt))
|
2022-03-15 13:51:21 +00:00
|
|
|
}
|
2022-05-07 02:27:51 +00:00
|
|
|
log.Info("stop query node flow graph",
|
2022-11-03 07:03:35 +00:00
|
|
|
zap.Int64("collectionID", q.collectionID),
|
|
|
|
zap.String("vchannel", q.vchannel),
|
2021-06-09 03:37:55 +00:00
|
|
|
)
|
2022-11-07 02:15:02 +00:00
|
|
|
|
|
|
|
metrics.CleanupQueryNodeCollectionMetrics(paramtable.GetNodeID(), q.collectionID)
|
2021-06-09 03:37:55 +00:00
|
|
|
}
|