2021-12-01 14:28:08 +00:00
|
|
|
// Licensed to the LF AI & Data foundation under one
|
|
|
|
// or more contributor license agreements. See the NOTICE file
|
|
|
|
// distributed with this work for additional information
|
|
|
|
// regarding copyright ownership. The ASF licenses this file
|
|
|
|
// to you under the Apache License, Version 2.0 (the
|
|
|
|
// "License"); you may not use this file except in compliance
|
2021-06-09 03:37:55 +00:00
|
|
|
// with the License. You may obtain a copy of the License at
|
|
|
|
//
|
2021-12-01 14:28:08 +00:00
|
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
2021-06-09 03:37:55 +00:00
|
|
|
//
|
2021-12-01 14:28:08 +00:00
|
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
// See the License for the specific language governing permissions and
|
|
|
|
// limitations under the License.
|
2021-06-09 03:37:55 +00:00
|
|
|
|
|
|
|
package querynode
|
|
|
|
|
|
|
|
import (
|
|
|
|
"context"
|
|
|
|
"errors"
|
2022-03-02 06:49:55 +00:00
|
|
|
"fmt"
|
2021-06-09 03:37:55 +00:00
|
|
|
|
|
|
|
"go.uber.org/zap"
|
|
|
|
|
|
|
|
"github.com/milvus-io/milvus/internal/log"
|
2022-03-02 06:49:55 +00:00
|
|
|
"github.com/milvus-io/milvus/internal/metrics"
|
2022-03-03 13:57:56 +00:00
|
|
|
"github.com/milvus-io/milvus/internal/mq/msgstream"
|
|
|
|
"github.com/milvus-io/milvus/internal/mq/msgstream/mqwrapper"
|
2021-06-09 03:37:55 +00:00
|
|
|
"github.com/milvus-io/milvus/internal/proto/internalpb"
|
|
|
|
"github.com/milvus-io/milvus/internal/util/flowgraph"
|
|
|
|
)
|
|
|
|
|
2021-09-27 11:06:07 +00:00
|
|
|
// queryNodeFlowGraph is a TimeTickedFlowGraph in query node
|
2021-06-09 03:37:55 +00:00
|
|
|
type queryNodeFlowGraph struct {
|
|
|
|
ctx context.Context
|
|
|
|
cancel context.CancelFunc
|
|
|
|
collectionID UniqueID
|
2021-06-15 12:06:10 +00:00
|
|
|
channel Channel
|
2021-06-09 03:37:55 +00:00
|
|
|
flowGraph *flowgraph.TimeTickedFlowGraph
|
|
|
|
dmlStream msgstream.MsgStream
|
2022-03-15 13:51:21 +00:00
|
|
|
consumerCnt int
|
2021-06-09 03:37:55 +00:00
|
|
|
}
|
|
|
|
|
2021-12-21 13:12:04 +00:00
|
|
|
// newQueryNodeFlowGraph returns a new queryNodeFlowGraph
|
2021-06-09 03:37:55 +00:00
|
|
|
func newQueryNodeFlowGraph(ctx context.Context,
|
|
|
|
collectionID UniqueID,
|
|
|
|
streamingReplica ReplicaInterface,
|
|
|
|
tSafeReplica TSafeReplicaInterface,
|
2021-06-15 12:06:10 +00:00
|
|
|
channel Channel,
|
2022-03-09 07:17:59 +00:00
|
|
|
factory msgstream.Factory) (*queryNodeFlowGraph, error) {
|
2021-06-09 03:37:55 +00:00
|
|
|
|
|
|
|
ctx1, cancel := context.WithCancel(ctx)
|
|
|
|
|
|
|
|
q := &queryNodeFlowGraph{
|
|
|
|
ctx: ctx1,
|
|
|
|
cancel: cancel,
|
|
|
|
collectionID: collectionID,
|
|
|
|
channel: channel,
|
|
|
|
flowGraph: flowgraph.NewTimeTickedFlowGraph(ctx1),
|
|
|
|
}
|
|
|
|
|
2022-04-27 02:01:47 +00:00
|
|
|
dmStreamNode, err := q.newDmInputNode(ctx1, factory, collectionID, channel)
|
2022-03-09 07:17:59 +00:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
2021-12-17 12:12:42 +00:00
|
|
|
var filterDmNode node = newFilteredDmNode(streamingReplica, collectionID)
|
2021-11-09 01:27:04 +00:00
|
|
|
var insertNode node = newInsertNode(streamingReplica)
|
2022-03-09 07:17:59 +00:00
|
|
|
var serviceTimeNode node = newServiceTimeNode(tSafeReplica, collectionID, channel)
|
2021-06-09 03:37:55 +00:00
|
|
|
|
|
|
|
q.flowGraph.AddNode(dmStreamNode)
|
|
|
|
q.flowGraph.AddNode(filterDmNode)
|
|
|
|
q.flowGraph.AddNode(insertNode)
|
|
|
|
q.flowGraph.AddNode(serviceTimeNode)
|
|
|
|
|
|
|
|
// dmStreamNode
|
2022-03-09 07:17:59 +00:00
|
|
|
err = q.flowGraph.SetEdges(dmStreamNode.Name(),
|
2021-06-09 03:37:55 +00:00
|
|
|
[]string{},
|
|
|
|
[]string{filterDmNode.Name()},
|
|
|
|
)
|
|
|
|
if err != nil {
|
2022-03-09 07:17:59 +00:00
|
|
|
return nil, fmt.Errorf("set edges failed in node: %s, err = %s", dmStreamNode.Name(), err.Error())
|
2021-06-09 03:37:55 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// filterDmNode
|
|
|
|
err = q.flowGraph.SetEdges(filterDmNode.Name(),
|
|
|
|
[]string{dmStreamNode.Name()},
|
|
|
|
[]string{insertNode.Name()},
|
|
|
|
)
|
|
|
|
if err != nil {
|
2022-03-09 07:17:59 +00:00
|
|
|
return nil, fmt.Errorf("set edges failed in node: %s, err = %s", filterDmNode.Name(), err.Error())
|
2021-06-09 03:37:55 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// insertNode
|
|
|
|
err = q.flowGraph.SetEdges(insertNode.Name(),
|
|
|
|
[]string{filterDmNode.Name()},
|
|
|
|
[]string{serviceTimeNode.Name()},
|
|
|
|
)
|
|
|
|
if err != nil {
|
2022-03-09 07:17:59 +00:00
|
|
|
return nil, fmt.Errorf("set edges failed in node: %s, err = %s", insertNode.Name(), err.Error())
|
2021-06-09 03:37:55 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// serviceTimeNode
|
|
|
|
err = q.flowGraph.SetEdges(serviceTimeNode.Name(),
|
|
|
|
[]string{insertNode.Name()},
|
|
|
|
[]string{},
|
|
|
|
)
|
|
|
|
if err != nil {
|
2022-03-09 07:17:59 +00:00
|
|
|
return nil, fmt.Errorf("set edges failed in node: %s, err = %s", serviceTimeNode.Name(), err.Error())
|
2021-06-09 03:37:55 +00:00
|
|
|
}
|
|
|
|
|
2022-03-09 07:17:59 +00:00
|
|
|
return q, nil
|
2021-06-09 03:37:55 +00:00
|
|
|
}
|
|
|
|
|
2021-12-21 13:13:55 +00:00
|
|
|
// newQueryNodeDeltaFlowGraph returns a new queryNodeFlowGraph
|
2021-11-06 03:02:58 +00:00
|
|
|
func newQueryNodeDeltaFlowGraph(ctx context.Context,
|
|
|
|
collectionID UniqueID,
|
|
|
|
historicalReplica ReplicaInterface,
|
|
|
|
tSafeReplica TSafeReplicaInterface,
|
|
|
|
channel Channel,
|
2022-03-09 07:17:59 +00:00
|
|
|
factory msgstream.Factory) (*queryNodeFlowGraph, error) {
|
2021-11-06 03:02:58 +00:00
|
|
|
|
|
|
|
ctx1, cancel := context.WithCancel(ctx)
|
|
|
|
|
|
|
|
q := &queryNodeFlowGraph{
|
|
|
|
ctx: ctx1,
|
|
|
|
cancel: cancel,
|
|
|
|
collectionID: collectionID,
|
|
|
|
channel: channel,
|
|
|
|
flowGraph: flowgraph.NewTimeTickedFlowGraph(ctx1),
|
|
|
|
}
|
|
|
|
|
2022-04-27 02:01:47 +00:00
|
|
|
dmStreamNode, err := q.newDmInputNode(ctx1, factory, collectionID, channel)
|
2022-03-09 07:17:59 +00:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
2021-12-17 12:12:42 +00:00
|
|
|
var filterDeleteNode node = newFilteredDeleteNode(historicalReplica, collectionID)
|
2021-11-06 03:02:58 +00:00
|
|
|
var deleteNode node = newDeleteNode(historicalReplica)
|
2022-03-09 07:17:59 +00:00
|
|
|
var serviceTimeNode node = newServiceTimeNode(tSafeReplica, collectionID, channel)
|
2021-11-06 03:02:58 +00:00
|
|
|
|
|
|
|
q.flowGraph.AddNode(dmStreamNode)
|
|
|
|
q.flowGraph.AddNode(filterDeleteNode)
|
|
|
|
q.flowGraph.AddNode(deleteNode)
|
|
|
|
q.flowGraph.AddNode(serviceTimeNode)
|
|
|
|
|
|
|
|
// dmStreamNode
|
2022-03-09 07:17:59 +00:00
|
|
|
err = q.flowGraph.SetEdges(dmStreamNode.Name(),
|
2021-11-06 03:02:58 +00:00
|
|
|
[]string{},
|
|
|
|
[]string{filterDeleteNode.Name()},
|
|
|
|
)
|
|
|
|
if err != nil {
|
2022-03-09 07:17:59 +00:00
|
|
|
return nil, fmt.Errorf("set edges failed in node: %s, err = %s", dmStreamNode.Name(), err.Error())
|
2021-11-06 03:02:58 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// filterDmNode
|
|
|
|
err = q.flowGraph.SetEdges(filterDeleteNode.Name(),
|
|
|
|
[]string{dmStreamNode.Name()},
|
|
|
|
[]string{deleteNode.Name()},
|
|
|
|
)
|
|
|
|
if err != nil {
|
2022-03-09 07:17:59 +00:00
|
|
|
return nil, fmt.Errorf("set edges failed in node: %s, err = %s", filterDeleteNode.Name(), err.Error())
|
2021-11-06 03:02:58 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// insertNode
|
|
|
|
err = q.flowGraph.SetEdges(deleteNode.Name(),
|
|
|
|
[]string{filterDeleteNode.Name()},
|
|
|
|
[]string{serviceTimeNode.Name()},
|
|
|
|
)
|
|
|
|
if err != nil {
|
2022-03-09 07:17:59 +00:00
|
|
|
return nil, fmt.Errorf("set edges failed in node: %s, err = %s", deleteNode.Name(), err.Error())
|
2021-11-06 03:02:58 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
// serviceTimeNode
|
|
|
|
err = q.flowGraph.SetEdges(serviceTimeNode.Name(),
|
|
|
|
[]string{deleteNode.Name()},
|
|
|
|
[]string{},
|
|
|
|
)
|
|
|
|
if err != nil {
|
2022-03-09 07:17:59 +00:00
|
|
|
return nil, fmt.Errorf("set edges failed in node: %s, err = %s", serviceTimeNode.Name(), err.Error())
|
2021-11-06 03:02:58 +00:00
|
|
|
}
|
|
|
|
|
2022-03-09 07:17:59 +00:00
|
|
|
return q, nil
|
2021-11-06 03:02:58 +00:00
|
|
|
}
|
|
|
|
|
2021-12-21 13:15:49 +00:00
|
|
|
// newDmInputNode returns a new inputNode
|
2022-04-27 02:01:47 +00:00
|
|
|
func (q *queryNodeFlowGraph) newDmInputNode(ctx context.Context, factory msgstream.Factory, collectionID UniqueID, channel Channel) (*flowgraph.InputNode, error) {
|
2021-06-09 03:37:55 +00:00
|
|
|
insertStream, err := factory.NewTtMsgStream(ctx)
|
|
|
|
if err != nil {
|
2022-03-09 07:17:59 +00:00
|
|
|
return nil, err
|
2021-06-09 03:37:55 +00:00
|
|
|
}
|
|
|
|
|
2022-03-09 07:17:59 +00:00
|
|
|
q.dmlStream = insertStream
|
|
|
|
|
2021-12-23 10:39:11 +00:00
|
|
|
maxQueueLength := Params.QueryNodeCfg.FlowGraphMaxQueueLength
|
|
|
|
maxParallelism := Params.QueryNodeCfg.FlowGraphMaxParallelism
|
2022-04-27 02:01:47 +00:00
|
|
|
name := fmt.Sprintf("dmInputNode-query-%d-%s", collectionID, channel)
|
|
|
|
node := flowgraph.NewInputNode(insertStream, name, maxQueueLength, maxParallelism)
|
2022-03-09 07:17:59 +00:00
|
|
|
return node, nil
|
2021-06-09 03:37:55 +00:00
|
|
|
}
|
|
|
|
|
2022-03-09 07:17:59 +00:00
|
|
|
// consumeFlowGraph would consume by channel and subName
|
|
|
|
func (q *queryNodeFlowGraph) consumeFlowGraph(channel Channel, subName ConsumeSubName) error {
|
2021-06-09 03:37:55 +00:00
|
|
|
if q.dmlStream == nil {
|
|
|
|
return errors.New("null dml message stream in flow graph")
|
|
|
|
}
|
|
|
|
q.dmlStream.AsConsumer([]string{channel}, subName)
|
2022-05-07 02:27:51 +00:00
|
|
|
log.Info("query node flow graph consumes from pChannel",
|
2021-06-15 12:06:10 +00:00
|
|
|
zap.Any("collectionID", q.collectionID),
|
|
|
|
zap.Any("channel", channel),
|
2021-09-18 01:13:50 +00:00
|
|
|
zap.Any("subName", subName),
|
2021-06-15 12:06:10 +00:00
|
|
|
)
|
2022-03-15 13:51:21 +00:00
|
|
|
q.consumerCnt++
|
2022-04-24 14:03:44 +00:00
|
|
|
metrics.QueryNodeNumConsumers.WithLabelValues(fmt.Sprint(Params.QueryNodeCfg.GetNodeID())).Inc()
|
2021-06-09 03:37:55 +00:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2022-03-09 07:17:59 +00:00
|
|
|
// consumeFlowGraphFromLatest would consume from latest by channel and subName
|
|
|
|
func (q *queryNodeFlowGraph) consumeFlowGraphFromLatest(channel Channel, subName ConsumeSubName) error {
|
2021-11-20 23:33:14 +00:00
|
|
|
if q.dmlStream == nil {
|
|
|
|
return errors.New("null dml message stream in flow graph")
|
|
|
|
}
|
2022-03-03 13:57:56 +00:00
|
|
|
q.dmlStream.AsConsumerWithPosition([]string{channel}, subName, mqwrapper.SubscriptionPositionLatest)
|
2022-05-07 02:27:51 +00:00
|
|
|
log.Info("query node flow graph consumes from pChannel",
|
2021-11-20 23:33:14 +00:00
|
|
|
zap.Any("collectionID", q.collectionID),
|
|
|
|
zap.Any("channel", channel),
|
|
|
|
zap.Any("subName", subName),
|
|
|
|
)
|
2022-03-15 13:51:21 +00:00
|
|
|
q.consumerCnt++
|
2022-04-24 14:03:44 +00:00
|
|
|
metrics.QueryNodeNumConsumers.WithLabelValues(fmt.Sprint(Params.QueryNodeCfg.GetNodeID())).Inc()
|
2021-11-20 23:33:14 +00:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2021-12-22 12:25:46 +00:00
|
|
|
// seekQueryNodeFlowGraph would seek by position
|
2021-06-09 03:37:55 +00:00
|
|
|
func (q *queryNodeFlowGraph) seekQueryNodeFlowGraph(position *internalpb.MsgPosition) error {
|
2021-06-10 06:32:51 +00:00
|
|
|
q.dmlStream.AsConsumer([]string{position.ChannelName}, position.MsgGroup)
|
2021-06-09 03:37:55 +00:00
|
|
|
err := q.dmlStream.Seek([]*internalpb.MsgPosition{position})
|
2022-05-07 02:27:51 +00:00
|
|
|
log.Info("query node flow graph seeks from pChannel",
|
2021-06-15 12:06:10 +00:00
|
|
|
zap.Any("collectionID", q.collectionID),
|
|
|
|
zap.Any("channel", position.ChannelName),
|
|
|
|
)
|
2022-03-15 13:51:21 +00:00
|
|
|
q.consumerCnt++
|
2022-04-24 14:03:44 +00:00
|
|
|
metrics.QueryNodeNumConsumers.WithLabelValues(fmt.Sprint(Params.QueryNodeCfg.GetNodeID())).Inc()
|
2021-06-09 03:37:55 +00:00
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
2021-12-23 13:50:15 +00:00
|
|
|
// close would close queryNodeFlowGraph
|
2021-06-09 03:37:55 +00:00
|
|
|
func (q *queryNodeFlowGraph) close() {
|
|
|
|
q.cancel()
|
|
|
|
q.flowGraph.Close()
|
2022-03-15 13:51:21 +00:00
|
|
|
if q.dmlStream != nil && q.consumerCnt > 0 {
|
2022-04-24 14:03:44 +00:00
|
|
|
metrics.QueryNodeNumConsumers.WithLabelValues(fmt.Sprint(Params.QueryNodeCfg.GetNodeID())).Sub(float64(q.consumerCnt))
|
2022-03-15 13:51:21 +00:00
|
|
|
}
|
2022-05-07 02:27:51 +00:00
|
|
|
log.Info("stop query node flow graph",
|
2021-06-09 03:37:55 +00:00
|
|
|
zap.Any("collectionID", q.collectionID),
|
|
|
|
zap.Any("channel", q.channel),
|
|
|
|
)
|
|
|
|
}
|