2021-04-19 07:16:33 +00:00
|
|
|
// Copyright (C) 2019-2020 Zilliz. All rights reserved.
|
|
|
|
//
|
|
|
|
// Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance
|
|
|
|
// with the License. You may obtain a copy of the License at
|
|
|
|
//
|
|
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
//
|
|
|
|
// Unless required by applicable law or agreed to in writing, software distributed under the License
|
|
|
|
// is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express
|
|
|
|
// or implied. See the License for the specific language governing permissions and limitations under the License.
|
|
|
|
|
2021-01-19 03:37:16 +00:00
|
|
|
package datanode
|
|
|
|
|
|
|
|
import (
|
|
|
|
"context"
|
2021-05-20 10:38:45 +00:00
|
|
|
"fmt"
|
2021-01-19 03:37:16 +00:00
|
|
|
"math"
|
2021-05-20 10:38:45 +00:00
|
|
|
"path"
|
|
|
|
"sync"
|
2021-01-19 03:37:16 +00:00
|
|
|
"testing"
|
|
|
|
"time"
|
|
|
|
|
2021-05-20 10:38:45 +00:00
|
|
|
"github.com/stretchr/testify/assert"
|
2021-01-19 03:37:16 +00:00
|
|
|
"github.com/stretchr/testify/require"
|
2021-05-26 04:09:03 +00:00
|
|
|
"go.uber.org/zap"
|
2021-01-19 03:37:16 +00:00
|
|
|
|
2021-05-20 10:38:45 +00:00
|
|
|
memkv "github.com/milvus-io/milvus/internal/kv/mem"
|
2021-05-26 04:09:03 +00:00
|
|
|
"github.com/milvus-io/milvus/internal/log"
|
2021-04-22 06:45:57 +00:00
|
|
|
"github.com/milvus-io/milvus/internal/msgstream"
|
2021-05-20 10:38:45 +00:00
|
|
|
"github.com/milvus-io/milvus/internal/proto/commonpb"
|
2021-05-26 04:09:03 +00:00
|
|
|
"github.com/milvus-io/milvus/internal/proto/datapb"
|
2021-05-20 10:38:45 +00:00
|
|
|
"github.com/milvus-io/milvus/internal/proto/etcdpb"
|
2021-04-22 06:45:57 +00:00
|
|
|
"github.com/milvus-io/milvus/internal/proto/internalpb"
|
2021-05-20 10:38:45 +00:00
|
|
|
"github.com/milvus-io/milvus/internal/proto/schemapb"
|
|
|
|
"github.com/milvus-io/milvus/internal/storage"
|
2021-04-22 06:45:57 +00:00
|
|
|
"github.com/milvus-io/milvus/internal/util/flowgraph"
|
2021-01-19 03:37:16 +00:00
|
|
|
)
|
|
|
|
|
2021-01-21 01:55:25 +00:00
|
|
|
func TestFlowGraphInsertBufferNode_Operate(t *testing.T) {
|
2021-01-19 03:37:16 +00:00
|
|
|
const ctxTimeInMillisecond = 2000
|
|
|
|
const closeWithDeadline = false
|
|
|
|
var ctx context.Context
|
|
|
|
|
|
|
|
if closeWithDeadline {
|
|
|
|
var cancel context.CancelFunc
|
|
|
|
d := time.Now().Add(ctxTimeInMillisecond * time.Millisecond)
|
|
|
|
ctx, cancel = context.WithDeadline(context.Background(), d)
|
|
|
|
defer cancel()
|
|
|
|
} else {
|
|
|
|
ctx = context.Background()
|
|
|
|
}
|
|
|
|
|
|
|
|
testPath := "/test/datanode/root/meta"
|
|
|
|
err := clearEtcd(testPath)
|
|
|
|
require.NoError(t, err)
|
|
|
|
Params.MetaRootPath = testPath
|
|
|
|
|
2021-01-24 13:20:11 +00:00
|
|
|
Factory := &MetaFactory{}
|
2021-01-22 11:36:09 +00:00
|
|
|
collMeta := Factory.CollectionMetaFactory(UniqueID(0), "coll1")
|
2021-01-19 03:37:16 +00:00
|
|
|
|
|
|
|
replica := newReplica()
|
2021-01-25 10:33:10 +00:00
|
|
|
err = replica.addCollection(collMeta.ID, collMeta.Schema)
|
2021-01-19 03:37:16 +00:00
|
|
|
require.NoError(t, err)
|
2021-03-30 01:47:27 +00:00
|
|
|
err = replica.addSegment(1, collMeta.ID, 0, Params.InsertChannelNames[0])
|
|
|
|
require.NoError(t, err)
|
2021-01-19 03:37:16 +00:00
|
|
|
|
2021-04-02 05:48:25 +00:00
|
|
|
msFactory := msgstream.NewPmsFactory()
|
2021-02-08 06:30:54 +00:00
|
|
|
m := map[string]interface{}{
|
|
|
|
"receiveBufSize": 1024,
|
|
|
|
"pulsarAddress": Params.PulsarAddress,
|
|
|
|
"pulsarBufSize": 1024}
|
|
|
|
err = msFactory.SetParams(m)
|
|
|
|
assert.Nil(t, err)
|
|
|
|
|
2021-05-18 11:45:00 +00:00
|
|
|
iBNode := newInsertBufferNode(ctx, newBinlogMeta(), replica, msFactory, NewAllocatorFactory())
|
2021-05-25 07:35:37 +00:00
|
|
|
|
2021-05-26 04:09:03 +00:00
|
|
|
ddlFlushedCh := make(chan []*datapb.DDLBinlogMeta)
|
|
|
|
dmlFlushedCh := make(chan []*datapb.ID2PathList)
|
2021-05-25 07:35:37 +00:00
|
|
|
|
|
|
|
inMsg := genInsertMsg(ddlFlushedCh, dmlFlushedCh)
|
2021-01-19 03:37:16 +00:00
|
|
|
var iMsg flowgraph.Msg = &inMsg
|
2021-03-25 06:41:46 +00:00
|
|
|
iBNode.Operate([]flowgraph.Msg{iMsg})
|
2021-05-25 07:35:37 +00:00
|
|
|
|
|
|
|
isflushed := <-dmlFlushedCh
|
2021-05-26 04:09:03 +00:00
|
|
|
assert.NotNil(t, isflushed)
|
|
|
|
log.Debug("DML binlog paths", zap.Any("paths", isflushed))
|
2021-01-19 03:37:16 +00:00
|
|
|
}
|
|
|
|
|
2021-05-26 04:09:03 +00:00
|
|
|
func genInsertMsg(ddlFlushedCh chan<- []*datapb.DDLBinlogMeta, dmlFlushedCh chan<- []*datapb.ID2PathList) insertMsg {
|
2021-01-19 03:37:16 +00:00
|
|
|
|
|
|
|
timeRange := TimeRange{
|
|
|
|
timestampMin: 0,
|
|
|
|
timestampMax: math.MaxUint64,
|
|
|
|
}
|
|
|
|
|
2021-03-16 09:55:42 +00:00
|
|
|
startPos := []*internalpb.MsgPosition{
|
|
|
|
{
|
2021-03-30 01:47:27 +00:00
|
|
|
ChannelName: Params.InsertChannelNames[0],
|
2021-03-27 01:46:54 +00:00
|
|
|
MsgID: make([]byte, 0),
|
2021-03-16 09:55:42 +00:00
|
|
|
Timestamp: 0,
|
|
|
|
},
|
|
|
|
}
|
|
|
|
|
2021-01-19 03:37:16 +00:00
|
|
|
var iMsg = &insertMsg{
|
|
|
|
insertMessages: make([]*msgstream.InsertMsg, 0),
|
2021-05-25 07:35:37 +00:00
|
|
|
// flushMessages: make([]*flushMsg, 0),
|
2021-01-19 03:37:16 +00:00
|
|
|
timeRange: TimeRange{
|
|
|
|
timestampMin: timeRange.timestampMin,
|
|
|
|
timestampMax: timeRange.timestampMax,
|
|
|
|
},
|
2021-03-16 09:55:42 +00:00
|
|
|
startPositions: startPos,
|
|
|
|
endPositions: startPos,
|
2021-01-19 03:37:16 +00:00
|
|
|
}
|
|
|
|
|
2021-02-03 09:30:10 +00:00
|
|
|
dataFactory := NewDataFactory()
|
|
|
|
iMsg.insertMessages = append(iMsg.insertMessages, dataFactory.GetMsgStreamInsertMsgs(2)...)
|
2021-01-19 03:37:16 +00:00
|
|
|
|
2021-05-25 07:35:37 +00:00
|
|
|
iMsg.flushMessage = &flushMsg{
|
2021-01-22 01:36:40 +00:00
|
|
|
msgID: 1,
|
2021-01-26 06:46:54 +00:00
|
|
|
timestamp: 2000,
|
2021-05-25 07:35:37 +00:00
|
|
|
segmentID: UniqueID(1),
|
2021-01-22 01:36:40 +00:00
|
|
|
collectionID: UniqueID(1),
|
2021-05-25 07:35:37 +00:00
|
|
|
ddlFlushedCh: ddlFlushedCh,
|
|
|
|
dmlFlushedCh: dmlFlushedCh,
|
2021-01-19 03:37:16 +00:00
|
|
|
}
|
2021-01-22 01:36:40 +00:00
|
|
|
|
2021-01-19 03:37:16 +00:00
|
|
|
return *iMsg
|
|
|
|
|
|
|
|
}
|
2021-05-20 10:38:45 +00:00
|
|
|
|
|
|
|
func TestFlushSegmentTxn(t *testing.T) {
|
|
|
|
idAllocMock := NewAllocatorFactory(1)
|
|
|
|
mockMinIO := memkv.NewMemoryKV()
|
|
|
|
|
|
|
|
segmentID, _ := idAllocMock.allocID()
|
|
|
|
partitionID, _ := idAllocMock.allocID()
|
|
|
|
collectionID, _ := idAllocMock.allocID()
|
|
|
|
fmt.Printf("generate segmentID, partitionID, collectionID: %v, %v, %v\n",
|
|
|
|
segmentID, partitionID, collectionID)
|
|
|
|
|
|
|
|
collMeta := genCollectionMeta(collectionID, "test_flush_segment_txn")
|
|
|
|
flushMap := sync.Map{}
|
|
|
|
flushMeta := newBinlogMeta()
|
|
|
|
|
|
|
|
finishCh := make(chan map[UniqueID]string)
|
|
|
|
|
|
|
|
insertData := &InsertData{
|
|
|
|
Data: make(map[storage.FieldID]storage.FieldData),
|
|
|
|
}
|
|
|
|
insertData.Data[0] = &storage.Int64FieldData{
|
|
|
|
NumRows: 10,
|
|
|
|
Data: []int64{0, 1, 2, 3, 4, 5, 6, 7, 8, 9},
|
|
|
|
}
|
|
|
|
insertData.Data[1] = &storage.Int64FieldData{
|
|
|
|
NumRows: 10,
|
|
|
|
Data: []int64{1, 2, 3, 4, 5, 6, 7, 8, 9, 10},
|
|
|
|
}
|
|
|
|
insertData.Data[107] = &storage.FloatFieldData{
|
|
|
|
NumRows: 10,
|
|
|
|
Data: make([]float32, 10),
|
|
|
|
}
|
|
|
|
flushMap.Store(segmentID, insertData)
|
|
|
|
|
|
|
|
go func(wait <-chan map[UniqueID]string) {
|
|
|
|
field2Path := <-wait
|
|
|
|
assert.NotNil(t, field2Path)
|
|
|
|
}(finishCh)
|
|
|
|
|
|
|
|
flushSegment(collMeta,
|
|
|
|
segmentID,
|
|
|
|
partitionID,
|
|
|
|
collectionID,
|
|
|
|
&flushMap,
|
|
|
|
mockMinIO,
|
|
|
|
finishCh,
|
|
|
|
idAllocMock)
|
|
|
|
|
|
|
|
k, _ := flushMeta.genKey(false, collectionID, partitionID, segmentID, 0)
|
|
|
|
key := path.Join(Params.StatsBinlogRootPath, k)
|
|
|
|
_, values, _ := mockMinIO.LoadWithPrefix(key)
|
|
|
|
assert.Equal(t, len(values), 1)
|
|
|
|
assert.Equal(t, values[0], `{"max":9,"min":0}`)
|
|
|
|
}
|
|
|
|
|
|
|
|
func genCollectionMeta(collectionID UniqueID, collectionName string) *etcdpb.CollectionMeta {
|
|
|
|
sch := schemapb.CollectionSchema{
|
|
|
|
Name: collectionName,
|
|
|
|
Description: "test collection by meta factory",
|
|
|
|
AutoID: true,
|
|
|
|
Fields: []*schemapb.FieldSchema{
|
|
|
|
{
|
|
|
|
FieldID: 0,
|
|
|
|
Name: "RowID",
|
|
|
|
Description: "RowID field",
|
|
|
|
DataType: schemapb.DataType_Int64,
|
|
|
|
TypeParams: []*commonpb.KeyValuePair{
|
|
|
|
{
|
|
|
|
Key: "f0_tk1",
|
|
|
|
Value: "f0_tv1",
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
{
|
|
|
|
FieldID: 1,
|
|
|
|
Name: "Timestamp",
|
|
|
|
Description: "Timestamp field",
|
|
|
|
DataType: schemapb.DataType_Int64,
|
|
|
|
TypeParams: []*commonpb.KeyValuePair{
|
|
|
|
{
|
|
|
|
Key: "f1_tk1",
|
|
|
|
Value: "f1_tv1",
|
|
|
|
},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
{
|
|
|
|
FieldID: 107,
|
|
|
|
Name: "float32_field",
|
|
|
|
Description: "field 107",
|
|
|
|
DataType: schemapb.DataType_Float,
|
|
|
|
TypeParams: []*commonpb.KeyValuePair{},
|
|
|
|
IndexParams: []*commonpb.KeyValuePair{},
|
|
|
|
},
|
|
|
|
},
|
|
|
|
}
|
|
|
|
|
|
|
|
collection := etcdpb.CollectionMeta{
|
|
|
|
ID: collectionID,
|
|
|
|
Schema: &sch,
|
|
|
|
CreateTime: Timestamp(1),
|
|
|
|
SegmentIDs: make([]UniqueID, 0),
|
|
|
|
PartitionIDs: []UniqueID{0},
|
|
|
|
}
|
|
|
|
return &collection
|
|
|
|
}
|