mirror of https://github.com/milvus-io/milvus.git
385 lines
11 KiB
Go
385 lines
11 KiB
Go
package writebuffer
|
|
|
|
import (
|
|
"context"
|
|
"testing"
|
|
|
|
"github.com/stretchr/testify/mock"
|
|
"github.com/stretchr/testify/suite"
|
|
|
|
"github.com/milvus-io/milvus-proto/go-api/v2/commonpb"
|
|
"github.com/milvus-io/milvus-proto/go-api/v2/msgpb"
|
|
"github.com/milvus-io/milvus-proto/go-api/v2/schemapb"
|
|
"github.com/milvus-io/milvus/internal/allocator"
|
|
"github.com/milvus-io/milvus/internal/flushcommon/metacache"
|
|
"github.com/milvus-io/milvus/internal/flushcommon/metacache/pkoracle"
|
|
"github.com/milvus-io/milvus/internal/flushcommon/syncmgr"
|
|
"github.com/milvus-io/milvus/internal/proto/datapb"
|
|
"github.com/milvus-io/milvus/pkg/common"
|
|
"github.com/milvus-io/milvus/pkg/util/conc"
|
|
"github.com/milvus-io/milvus/pkg/util/merr"
|
|
"github.com/milvus-io/milvus/pkg/util/paramtable"
|
|
)
|
|
|
|
type WriteBufferSuite struct {
|
|
suite.Suite
|
|
collID int64
|
|
channelName string
|
|
collSchema *schemapb.CollectionSchema
|
|
wb *writeBufferBase
|
|
syncMgr *syncmgr.MockSyncManager
|
|
metacache *metacache.MockMetaCache
|
|
}
|
|
|
|
func (s *WriteBufferSuite) SetupSuite() {
|
|
paramtable.Get().Init(paramtable.NewBaseTable())
|
|
s.collID = 100
|
|
s.collSchema = &schemapb.CollectionSchema{
|
|
Name: "wb_base_collection",
|
|
Fields: []*schemapb.FieldSchema{
|
|
{FieldID: 100, DataType: schemapb.DataType_Int64, IsPrimaryKey: true, Name: "pk"},
|
|
{FieldID: 101, DataType: schemapb.DataType_FloatVector, TypeParams: []*commonpb.KeyValuePair{
|
|
{Key: common.DimKey, Value: "128"},
|
|
}},
|
|
},
|
|
}
|
|
s.channelName = "by-dev-rootcoord-dml_0v0"
|
|
}
|
|
|
|
func (s *WriteBufferSuite) SetupTest() {
|
|
s.syncMgr = syncmgr.NewMockSyncManager(s.T())
|
|
s.metacache = metacache.NewMockMetaCache(s.T())
|
|
s.metacache.EXPECT().Schema().Return(s.collSchema).Maybe()
|
|
s.metacache.EXPECT().Collection().Return(s.collID).Maybe()
|
|
var err error
|
|
s.wb, err = newWriteBufferBase(s.channelName, s.metacache, s.syncMgr, &writeBufferOption{
|
|
pkStatsFactory: func(vchannel *datapb.SegmentInfo) pkoracle.PkStat {
|
|
return pkoracle.NewBloomFilterSet()
|
|
},
|
|
})
|
|
s.Require().NoError(err)
|
|
}
|
|
|
|
func (s *WriteBufferSuite) TestDefaultOption() {
|
|
s.Run("default BFPkOracle", func() {
|
|
paramtable.Get().Save(paramtable.Get().DataCoordCfg.EnableLevelZeroSegment.Key, "false")
|
|
defer paramtable.Get().Reset(paramtable.Get().DataCoordCfg.EnableLevelZeroSegment.Key)
|
|
wb, err := NewWriteBuffer(s.channelName, s.metacache, s.syncMgr)
|
|
s.NoError(err)
|
|
_, ok := wb.(*bfWriteBuffer)
|
|
s.True(ok)
|
|
})
|
|
|
|
s.Run("default L0Delta policy", func() {
|
|
paramtable.Get().Save(paramtable.Get().DataCoordCfg.EnableLevelZeroSegment.Key, "true")
|
|
defer paramtable.Get().Reset(paramtable.Get().DataCoordCfg.EnableLevelZeroSegment.Key)
|
|
wb, err := NewWriteBuffer(s.channelName, s.metacache, s.syncMgr, WithIDAllocator(allocator.NewMockGIDAllocator()))
|
|
s.NoError(err)
|
|
_, ok := wb.(*l0WriteBuffer)
|
|
s.True(ok)
|
|
})
|
|
}
|
|
|
|
func (s *WriteBufferSuite) TestWriteBufferType() {
|
|
wb, err := NewWriteBuffer(s.channelName, s.metacache, s.syncMgr, WithDeletePolicy(DeletePolicyBFPkOracle))
|
|
s.NoError(err)
|
|
|
|
_, ok := wb.(*bfWriteBuffer)
|
|
s.True(ok)
|
|
|
|
wb, err = NewWriteBuffer(s.channelName, s.metacache, s.syncMgr, WithDeletePolicy(DeletePolicyL0Delta), WithIDAllocator(allocator.NewMockGIDAllocator()))
|
|
s.NoError(err)
|
|
_, ok = wb.(*l0WriteBuffer)
|
|
s.True(ok)
|
|
|
|
_, err = NewWriteBuffer(s.channelName, s.metacache, s.syncMgr, WithDeletePolicy(""))
|
|
s.Error(err)
|
|
}
|
|
|
|
func (s *WriteBufferSuite) TestHasSegment() {
|
|
segmentID := int64(1001)
|
|
|
|
s.False(s.wb.HasSegment(segmentID))
|
|
|
|
s.wb.getOrCreateBuffer(segmentID)
|
|
|
|
s.True(s.wb.HasSegment(segmentID))
|
|
}
|
|
|
|
func (s *WriteBufferSuite) TestFlushSegments() {
|
|
segmentID := int64(1001)
|
|
|
|
s.metacache.EXPECT().UpdateSegments(mock.Anything, mock.Anything, mock.Anything).Return()
|
|
s.metacache.EXPECT().GetSegmentByID(mock.Anything, mock.Anything, mock.Anything).Return(nil, true)
|
|
|
|
wb, err := NewWriteBuffer(s.channelName, s.metacache, s.syncMgr, WithDeletePolicy(DeletePolicyBFPkOracle))
|
|
s.NoError(err)
|
|
|
|
err = wb.SealSegments(context.Background(), []int64{segmentID})
|
|
s.NoError(err)
|
|
}
|
|
|
|
func (s *WriteBufferSuite) TestGetCheckpoint() {
|
|
s.Run("use_consume_cp", func() {
|
|
s.wb.checkpoint = &msgpb.MsgPosition{
|
|
Timestamp: 1000,
|
|
}
|
|
|
|
checkpoint := s.wb.GetCheckpoint()
|
|
s.EqualValues(1000, checkpoint.GetTimestamp())
|
|
})
|
|
|
|
s.Run("use_syncing_segment_cp", func() {
|
|
s.wb.checkpoint = &msgpb.MsgPosition{
|
|
Timestamp: 1000,
|
|
}
|
|
|
|
s.wb.syncCheckpoint.Add(1, &msgpb.MsgPosition{Timestamp: 500}, "syncing segments")
|
|
defer s.wb.syncCheckpoint.Remove(1, 500)
|
|
|
|
checkpoint := s.wb.GetCheckpoint()
|
|
s.EqualValues(500, checkpoint.GetTimestamp())
|
|
})
|
|
|
|
s.Run("use_segment_buffer_min", func() {
|
|
s.wb.checkpoint = &msgpb.MsgPosition{
|
|
Timestamp: 1000,
|
|
}
|
|
|
|
s.wb.syncCheckpoint.Add(1, &msgpb.MsgPosition{Timestamp: 500}, "syncing segments")
|
|
defer s.wb.syncCheckpoint.Remove(1, 500)
|
|
|
|
buf1, err := newSegmentBuffer(2, s.collSchema)
|
|
s.Require().NoError(err)
|
|
buf1.insertBuffer.startPos = &msgpb.MsgPosition{
|
|
Timestamp: 440,
|
|
}
|
|
buf1.deltaBuffer.startPos = &msgpb.MsgPosition{
|
|
Timestamp: 400,
|
|
}
|
|
buf2, err := newSegmentBuffer(3, s.collSchema)
|
|
s.Require().NoError(err)
|
|
buf2.insertBuffer.startPos = &msgpb.MsgPosition{
|
|
Timestamp: 550,
|
|
}
|
|
buf2.deltaBuffer.startPos = &msgpb.MsgPosition{
|
|
Timestamp: 600,
|
|
}
|
|
|
|
s.wb.mut.Lock()
|
|
s.wb.buffers[2] = buf1
|
|
s.wb.buffers[3] = buf2
|
|
s.wb.mut.Unlock()
|
|
|
|
defer func() {
|
|
s.wb.mut.Lock()
|
|
defer s.wb.mut.Unlock()
|
|
s.wb.buffers = make(map[int64]*segmentBuffer)
|
|
}()
|
|
|
|
checkpoint := s.wb.GetCheckpoint()
|
|
s.EqualValues(400, checkpoint.GetTimestamp())
|
|
})
|
|
|
|
s.Run("sync_mgr_smaller", func() {
|
|
s.wb.checkpoint = &msgpb.MsgPosition{
|
|
Timestamp: 1000,
|
|
}
|
|
|
|
s.wb.syncCheckpoint.Add(1, &msgpb.MsgPosition{Timestamp: 300}, "syncing segments")
|
|
defer s.wb.syncCheckpoint.Remove(1, 300)
|
|
|
|
buf1, err := newSegmentBuffer(2, s.collSchema)
|
|
s.Require().NoError(err)
|
|
buf1.insertBuffer.startPos = &msgpb.MsgPosition{
|
|
Timestamp: 440,
|
|
}
|
|
buf1.deltaBuffer.startPos = &msgpb.MsgPosition{
|
|
Timestamp: 400,
|
|
}
|
|
buf2, err := newSegmentBuffer(3, s.collSchema)
|
|
s.Require().NoError(err)
|
|
buf2.insertBuffer.startPos = &msgpb.MsgPosition{
|
|
Timestamp: 550,
|
|
}
|
|
buf2.deltaBuffer.startPos = &msgpb.MsgPosition{
|
|
Timestamp: 600,
|
|
}
|
|
|
|
s.wb.mut.Lock()
|
|
s.wb.buffers[2] = buf1
|
|
s.wb.buffers[3] = buf2
|
|
s.wb.mut.Unlock()
|
|
|
|
defer func() {
|
|
s.wb.mut.Lock()
|
|
defer s.wb.mut.Unlock()
|
|
s.wb.buffers = make(map[int64]*segmentBuffer)
|
|
}()
|
|
|
|
checkpoint := s.wb.GetCheckpoint()
|
|
s.EqualValues(300, checkpoint.GetTimestamp())
|
|
})
|
|
|
|
s.Run("segment_buffer_smaller", func() {
|
|
s.wb.checkpoint = &msgpb.MsgPosition{
|
|
Timestamp: 1000,
|
|
}
|
|
|
|
s.wb.syncCheckpoint.Add(1, &msgpb.MsgPosition{Timestamp: 800}, "syncing segments")
|
|
defer s.wb.syncCheckpoint.Remove(1, 800)
|
|
|
|
buf1, err := newSegmentBuffer(2, s.collSchema)
|
|
s.Require().NoError(err)
|
|
buf1.insertBuffer.startPos = &msgpb.MsgPosition{
|
|
Timestamp: 440,
|
|
}
|
|
buf1.deltaBuffer.startPos = &msgpb.MsgPosition{
|
|
Timestamp: 400,
|
|
}
|
|
buf2, err := newSegmentBuffer(3, s.collSchema)
|
|
s.Require().NoError(err)
|
|
buf2.insertBuffer.startPos = &msgpb.MsgPosition{
|
|
Timestamp: 550,
|
|
}
|
|
buf2.deltaBuffer.startPos = &msgpb.MsgPosition{
|
|
Timestamp: 600,
|
|
}
|
|
|
|
s.wb.mut.Lock()
|
|
s.wb.buffers[2] = buf1
|
|
s.wb.buffers[3] = buf2
|
|
s.wb.mut.Unlock()
|
|
|
|
defer func() {
|
|
s.wb.mut.Lock()
|
|
defer s.wb.mut.Unlock()
|
|
s.wb.buffers = make(map[int64]*segmentBuffer)
|
|
}()
|
|
|
|
checkpoint := s.wb.GetCheckpoint()
|
|
s.EqualValues(400, checkpoint.GetTimestamp())
|
|
})
|
|
}
|
|
|
|
func (s *WriteBufferSuite) TestSyncSegmentsError() {
|
|
wb, err := newWriteBufferBase(s.channelName, s.metacache, s.syncMgr, &writeBufferOption{
|
|
pkStatsFactory: func(vchannel *datapb.SegmentInfo) pkoracle.PkStat {
|
|
return pkoracle.NewBloomFilterSet()
|
|
},
|
|
})
|
|
s.Require().NoError(err)
|
|
|
|
serializer := syncmgr.NewMockSerializer(s.T())
|
|
|
|
wb.serializer = serializer
|
|
|
|
segment := metacache.NewSegmentInfo(&datapb.SegmentInfo{
|
|
ID: 1,
|
|
}, nil)
|
|
s.metacache.EXPECT().GetSegmentByID(int64(1)).Return(segment, true)
|
|
s.metacache.EXPECT().UpdateSegments(mock.Anything, mock.Anything).Return()
|
|
|
|
s.Run("segment_not_found", func() {
|
|
serializer.EXPECT().EncodeBuffer(mock.Anything, mock.Anything).Return(nil, merr.WrapErrSegmentNotFound(1)).Once()
|
|
s.NotPanics(func() {
|
|
wb.syncSegments(context.Background(), []int64{1})
|
|
})
|
|
})
|
|
|
|
s.Run("other_err", func() {
|
|
serializer.EXPECT().EncodeBuffer(mock.Anything, mock.Anything).Return(nil, merr.WrapErrServiceInternal("mocked")).Once()
|
|
s.Panics(func() {
|
|
wb.syncSegments(context.Background(), []int64{1})
|
|
})
|
|
})
|
|
}
|
|
|
|
func (s *WriteBufferSuite) TestEvictBuffer() {
|
|
wb, err := newWriteBufferBase(s.channelName, s.metacache, s.syncMgr, &writeBufferOption{
|
|
pkStatsFactory: func(vchannel *datapb.SegmentInfo) pkoracle.PkStat {
|
|
return pkoracle.NewBloomFilterSet()
|
|
},
|
|
})
|
|
s.Require().NoError(err)
|
|
|
|
serializer := syncmgr.NewMockSerializer(s.T())
|
|
|
|
wb.serializer = serializer
|
|
|
|
s.Run("no_checkpoint", func() {
|
|
wb.mut.Lock()
|
|
wb.buffers[100] = &segmentBuffer{}
|
|
wb.mut.Unlock()
|
|
defer func() {
|
|
wb.mut.Lock()
|
|
defer wb.mut.Unlock()
|
|
wb.buffers = make(map[int64]*segmentBuffer)
|
|
}()
|
|
|
|
wb.EvictBuffer(GetOldestBufferPolicy(1))
|
|
|
|
serializer.AssertNotCalled(s.T(), "EncodeBuffer")
|
|
})
|
|
|
|
s.Run("trigger_sync", func() {
|
|
buf1, err := newSegmentBuffer(2, s.collSchema)
|
|
s.Require().NoError(err)
|
|
buf1.insertBuffer.startPos = &msgpb.MsgPosition{
|
|
Timestamp: 440,
|
|
}
|
|
buf1.deltaBuffer.startPos = &msgpb.MsgPosition{
|
|
Timestamp: 400,
|
|
}
|
|
buf2, err := newSegmentBuffer(3, s.collSchema)
|
|
s.Require().NoError(err)
|
|
buf2.insertBuffer.startPos = &msgpb.MsgPosition{
|
|
Timestamp: 550,
|
|
}
|
|
buf2.deltaBuffer.startPos = &msgpb.MsgPosition{
|
|
Timestamp: 600,
|
|
}
|
|
|
|
wb.mut.Lock()
|
|
wb.buffers[2] = buf1
|
|
wb.buffers[3] = buf2
|
|
wb.checkpoint = &msgpb.MsgPosition{Timestamp: 100}
|
|
wb.mut.Unlock()
|
|
|
|
segment := metacache.NewSegmentInfo(&datapb.SegmentInfo{
|
|
ID: 2,
|
|
}, nil)
|
|
s.metacache.EXPECT().GetSegmentByID(int64(2)).Return(segment, true)
|
|
s.metacache.EXPECT().UpdateSegments(mock.Anything, mock.Anything).Return()
|
|
serializer.EXPECT().EncodeBuffer(mock.Anything, mock.Anything).Return(syncmgr.NewSyncTask(), nil)
|
|
s.syncMgr.EXPECT().SyncData(mock.Anything, mock.Anything, mock.Anything).Return(conc.Go[struct{}](func() (struct{}, error) {
|
|
return struct{}{}, nil
|
|
}))
|
|
defer func() {
|
|
s.wb.mut.Lock()
|
|
defer s.wb.mut.Unlock()
|
|
s.wb.buffers = make(map[int64]*segmentBuffer)
|
|
}()
|
|
wb.EvictBuffer(GetOldestBufferPolicy(1))
|
|
})
|
|
}
|
|
|
|
func (s *WriteBufferSuite) TestDropPartitions() {
|
|
wb, err := newWriteBufferBase(s.channelName, s.metacache, s.syncMgr, &writeBufferOption{
|
|
pkStatsFactory: func(vchannel *datapb.SegmentInfo) pkoracle.PkStat {
|
|
return pkoracle.NewBloomFilterSet()
|
|
},
|
|
})
|
|
s.Require().NoError(err)
|
|
|
|
segIDs := []int64{1, 2, 3}
|
|
s.metacache.EXPECT().GetSegmentIDsBy(mock.Anything).Return(segIDs).Once()
|
|
s.metacache.EXPECT().UpdateSegments(mock.AnythingOfType("metacache.SegmentAction"), metacache.WithSegmentIDs(segIDs...)).Return().Once()
|
|
|
|
wb.dropPartitions([]int64{100, 101})
|
|
}
|
|
|
|
func TestWriteBufferBase(t *testing.T) {
|
|
suite.Run(t, new(WriteBufferSuite))
|
|
}
|