2021-01-15 07:28:54 +00:00
|
|
|
package querynodeimp
|
2020-08-25 07:45:19 +00:00
|
|
|
|
2020-08-29 09:42:41 +00:00
|
|
|
/*
|
|
|
|
|
2020-10-23 10:01:24 +00:00
|
|
|
#cgo CFLAGS: -I${SRCDIR}/../core/output/include
|
2020-08-29 09:42:41 +00:00
|
|
|
|
2020-10-31 07:11:47 +00:00
|
|
|
#cgo LDFLAGS: -L${SRCDIR}/../core/output/lib -lmilvus_segcore -Wl,-rpath=${SRCDIR}/../core/output/lib
|
2020-08-29 09:42:41 +00:00
|
|
|
|
2020-11-25 02:31:51 +00:00
|
|
|
#include "segcore/collection_c.h"
|
|
|
|
#include "segcore/plan_c.h"
|
|
|
|
#include "segcore/reduce_c.h"
|
2020-08-29 09:42:41 +00:00
|
|
|
*/
|
2020-08-25 07:45:19 +00:00
|
|
|
import "C"
|
2020-08-28 09:29:26 +00:00
|
|
|
import (
|
2020-11-04 09:58:43 +00:00
|
|
|
"strconv"
|
2021-01-12 10:03:24 +00:00
|
|
|
"sync"
|
2020-11-05 02:52:50 +00:00
|
|
|
"unsafe"
|
2020-11-04 09:58:43 +00:00
|
|
|
|
2020-11-09 08:27:11 +00:00
|
|
|
"github.com/stretchr/testify/assert"
|
|
|
|
|
2020-10-19 10:31:00 +00:00
|
|
|
"github.com/zilliztech/milvus-distributed/internal/errors"
|
2020-11-04 08:28:14 +00:00
|
|
|
"github.com/zilliztech/milvus-distributed/internal/proto/commonpb"
|
2020-08-28 09:29:26 +00:00
|
|
|
)
|
|
|
|
|
2021-01-12 10:03:24 +00:00
|
|
|
// indexParam holds the index parameters of a single field as string key/value
// pairs. It is an alias, so it is interchangeable with map[string]string.
type indexParam = map[string]string
|
|
|
|
|
2020-08-25 07:45:19 +00:00
|
|
|
type Segment struct {
|
2021-01-13 02:40:46 +00:00
|
|
|
segmentPtr C.CSegmentBase
|
|
|
|
segmentID UniqueID
|
|
|
|
partitionTag string // TODO: use partitionID
|
|
|
|
collectionID UniqueID
|
|
|
|
lastMemSize int64
|
|
|
|
lastRowCount int64
|
|
|
|
|
|
|
|
rmMutex sync.Mutex // guards recentlyModified
|
2020-11-05 02:52:50 +00:00
|
|
|
recentlyModified bool
|
2021-01-13 02:40:46 +00:00
|
|
|
|
|
|
|
paramMutex sync.RWMutex // guards indexParam
|
|
|
|
indexParam map[int64]indexParam
|
2020-08-25 07:45:19 +00:00
|
|
|
}
|
|
|
|
|
2020-11-09 08:27:11 +00:00
|
|
|
func (s *Segment) ID() UniqueID {
|
|
|
|
return s.segmentID
|
|
|
|
}
|
|
|
|
|
2021-01-12 10:03:24 +00:00
|
|
|
func (s *Segment) SetRecentlyModified(modify bool) {
|
2021-01-13 02:40:46 +00:00
|
|
|
s.rmMutex.Lock()
|
|
|
|
defer s.rmMutex.Unlock()
|
2021-01-12 10:03:24 +00:00
|
|
|
s.recentlyModified = modify
|
|
|
|
}
|
|
|
|
|
|
|
|
func (s *Segment) GetRecentlyModified() bool {
|
2021-01-13 02:40:46 +00:00
|
|
|
s.rmMutex.Lock()
|
|
|
|
defer s.rmMutex.Unlock()
|
2021-01-12 10:03:24 +00:00
|
|
|
return s.recentlyModified
|
|
|
|
}
|
|
|
|
|
2020-11-09 08:27:11 +00:00
|
|
|
//-------------------------------------------------------------------------------------- constructor and destructor
|
2020-12-24 12:55:40 +00:00
|
|
|
func newSegment(collection *Collection, segmentID int64, partitionTag string, collectionID UniqueID) *Segment {
|
2020-11-09 08:27:11 +00:00
|
|
|
/*
|
|
|
|
CSegmentBase
|
|
|
|
newSegment(CPartition partition, unsigned long segment_id);
|
|
|
|
*/
|
2021-01-12 10:03:24 +00:00
|
|
|
initIndexParam := make(map[int64]indexParam)
|
2020-11-09 10:07:15 +00:00
|
|
|
segmentPtr := C.NewSegment(collection.collectionPtr, C.ulong(segmentID))
|
2020-12-24 12:55:40 +00:00
|
|
|
var newSegment = &Segment{
|
|
|
|
segmentPtr: segmentPtr,
|
|
|
|
segmentID: segmentID,
|
|
|
|
partitionTag: partitionTag,
|
|
|
|
collectionID: collectionID,
|
2021-01-12 10:03:24 +00:00
|
|
|
indexParam: initIndexParam,
|
2020-12-24 12:55:40 +00:00
|
|
|
}
|
2020-11-09 08:27:11 +00:00
|
|
|
|
|
|
|
return newSegment
|
|
|
|
}
|
|
|
|
|
|
|
|
func deleteSegment(segment *Segment) {
|
|
|
|
/*
|
|
|
|
void
|
|
|
|
deleteSegment(CSegmentBase segment);
|
|
|
|
*/
|
|
|
|
cPtr := segment.segmentPtr
|
|
|
|
C.DeleteSegment(cPtr)
|
|
|
|
}
|
|
|
|
|
|
|
|
//-------------------------------------------------------------------------------------- stats functions
|
2020-11-05 02:52:50 +00:00
|
|
|
func (s *Segment) getRowCount() int64 {
|
2020-09-21 10:16:06 +00:00
|
|
|
/*
|
2020-10-24 02:45:57 +00:00
|
|
|
long int
|
2020-11-05 02:52:50 +00:00
|
|
|
getRowCount(CSegmentBase c_segment);
|
2020-09-03 11:58:33 +00:00
|
|
|
*/
|
2020-11-09 08:27:11 +00:00
|
|
|
var rowCount = C.GetRowCount(s.segmentPtr)
|
2020-09-03 11:58:33 +00:00
|
|
|
return int64(rowCount)
|
2020-08-25 07:45:19 +00:00
|
|
|
}
|
|
|
|
|
2020-11-05 02:52:50 +00:00
|
|
|
func (s *Segment) getDeletedCount() int64 {
|
2020-09-21 10:16:06 +00:00
|
|
|
/*
|
2020-10-24 02:45:57 +00:00
|
|
|
long int
|
2020-11-05 02:52:50 +00:00
|
|
|
getDeletedCount(CSegmentBase c_segment);
|
2020-09-03 11:58:33 +00:00
|
|
|
*/
|
2020-11-09 08:27:11 +00:00
|
|
|
var deletedCount = C.GetDeletedCount(s.segmentPtr)
|
2020-09-03 11:58:33 +00:00
|
|
|
return int64(deletedCount)
|
|
|
|
}
|
|
|
|
|
2020-11-05 02:52:50 +00:00
|
|
|
func (s *Segment) getMemSize() int64 {
|
2020-09-21 10:16:06 +00:00
|
|
|
/*
|
2020-10-24 02:45:57 +00:00
|
|
|
long int
|
|
|
|
GetMemoryUsageInBytes(CSegmentBase c_segment);
|
2020-09-21 07:10:54 +00:00
|
|
|
*/
|
2020-11-09 08:27:11 +00:00
|
|
|
var memoryUsageInBytes = C.GetMemoryUsageInBytes(s.segmentPtr)
|
2020-09-21 07:10:54 +00:00
|
|
|
|
2020-10-29 11:55:57 +00:00
|
|
|
return int64(memoryUsageInBytes)
|
2020-09-16 07:21:10 +00:00
|
|
|
}
|
|
|
|
|
2020-11-12 03:18:23 +00:00
|
|
|
//-------------------------------------------------------------------------------------- preDm functions
|
2020-11-05 02:52:50 +00:00
|
|
|
func (s *Segment) segmentPreInsert(numOfRecords int) int64 {
|
2020-09-21 10:16:06 +00:00
|
|
|
/*
|
2020-10-24 02:45:57 +00:00
|
|
|
long int
|
|
|
|
PreInsert(CSegmentBase c_segment, long int size);
|
2020-09-09 07:24:07 +00:00
|
|
|
*/
|
2020-11-09 08:27:11 +00:00
|
|
|
var offset = C.PreInsert(s.segmentPtr, C.long(int64(numOfRecords)))
|
2020-09-09 07:24:07 +00:00
|
|
|
|
2020-09-12 08:57:37 +00:00
|
|
|
return int64(offset)
|
2020-09-09 07:24:07 +00:00
|
|
|
}
|
|
|
|
|
2020-11-05 02:52:50 +00:00
|
|
|
func (s *Segment) segmentPreDelete(numOfRecords int) int64 {
|
2020-09-21 10:16:06 +00:00
|
|
|
/*
|
2020-10-24 02:45:57 +00:00
|
|
|
long int
|
|
|
|
PreDelete(CSegmentBase c_segment, long int size);
|
2020-09-09 07:24:07 +00:00
|
|
|
*/
|
2020-11-09 08:27:11 +00:00
|
|
|
var offset = C.PreDelete(s.segmentPtr, C.long(int64(numOfRecords)))
|
2020-09-09 07:24:07 +00:00
|
|
|
|
2020-09-12 08:57:37 +00:00
|
|
|
return int64(offset)
|
2020-09-09 07:24:07 +00:00
|
|
|
}
|
|
|
|
|
2020-11-09 08:27:11 +00:00
|
|
|
//-------------------------------------------------------------------------------------- dm & search functions
|
2020-11-05 02:52:50 +00:00
|
|
|
func (s *Segment) segmentInsert(offset int64, entityIDs *[]UniqueID, timestamps *[]Timestamp, records *[]*commonpb.Blob) error {
|
2020-09-21 10:16:06 +00:00
|
|
|
/*
|
2020-11-26 08:01:31 +00:00
|
|
|
CStatus
|
2020-10-24 02:45:57 +00:00
|
|
|
Insert(CSegmentBase c_segment,
|
|
|
|
long int reserved_offset,
|
|
|
|
signed long int size,
|
|
|
|
const long* primary_keys,
|
|
|
|
const unsigned long* timestamps,
|
|
|
|
void* raw_data,
|
|
|
|
int sizeof_per_row,
|
|
|
|
signed long int count);
|
2020-09-02 08:23:50 +00:00
|
|
|
*/
|
2020-09-08 02:39:09 +00:00
|
|
|
// Blobs to one big blob
|
2020-11-05 02:52:50 +00:00
|
|
|
var numOfRow = len(*entityIDs)
|
|
|
|
var sizeofPerRow = len((*records)[0].Value)
|
|
|
|
|
|
|
|
assert.Equal(nil, numOfRow, len(*records))
|
|
|
|
|
|
|
|
var rawData = make([]byte, numOfRow*sizeofPerRow)
|
|
|
|
var copyOffset = 0
|
|
|
|
for i := 0; i < len(*records); i++ {
|
|
|
|
copy(rawData[copyOffset:], (*records)[i].Value)
|
|
|
|
copyOffset += sizeofPerRow
|
|
|
|
}
|
|
|
|
|
|
|
|
var cOffset = C.long(offset)
|
|
|
|
var cNumOfRows = C.long(numOfRow)
|
|
|
|
var cEntityIdsPtr = (*C.long)(&(*entityIDs)[0])
|
|
|
|
var cTimestampsPtr = (*C.ulong)(&(*timestamps)[0])
|
|
|
|
var cSizeofPerRow = C.int(sizeofPerRow)
|
|
|
|
var cRawDataVoidPtr = unsafe.Pointer(&rawData[0])
|
|
|
|
|
2020-11-09 08:27:11 +00:00
|
|
|
var status = C.Insert(s.segmentPtr,
|
2020-11-05 02:52:50 +00:00
|
|
|
cOffset,
|
|
|
|
cNumOfRows,
|
|
|
|
cEntityIdsPtr,
|
|
|
|
cTimestampsPtr,
|
|
|
|
cRawDataVoidPtr,
|
|
|
|
cSizeofPerRow,
|
|
|
|
cNumOfRows)
|
|
|
|
|
2020-11-26 08:01:31 +00:00
|
|
|
errorCode := status.error_code
|
|
|
|
|
|
|
|
if errorCode != 0 {
|
|
|
|
errorMsg := C.GoString(status.error_msg)
|
|
|
|
defer C.free(unsafe.Pointer(status.error_msg))
|
|
|
|
return errors.New("Insert failed, C runtime error detected, error code = " + strconv.Itoa(int(errorCode)) + ", error msg = " + errorMsg)
|
2020-11-05 02:52:50 +00:00
|
|
|
}
|
2020-09-02 09:18:49 +00:00
|
|
|
|
2021-01-12 10:03:24 +00:00
|
|
|
s.SetRecentlyModified(true)
|
2020-09-07 09:01:46 +00:00
|
|
|
return nil
|
2020-08-28 09:29:26 +00:00
|
|
|
}
|
|
|
|
|
2020-11-05 02:52:50 +00:00
|
|
|
func (s *Segment) segmentDelete(offset int64, entityIDs *[]UniqueID, timestamps *[]Timestamp) error {
|
2020-09-21 10:16:06 +00:00
|
|
|
/*
|
2020-11-26 08:01:31 +00:00
|
|
|
CStatus
|
2020-10-24 02:45:57 +00:00
|
|
|
Delete(CSegmentBase c_segment,
|
|
|
|
long int reserved_offset,
|
|
|
|
long size,
|
|
|
|
const long* primary_keys,
|
|
|
|
const unsigned long* timestamps);
|
2020-09-02 08:23:50 +00:00
|
|
|
*/
|
2020-09-09 07:24:07 +00:00
|
|
|
var cOffset = C.long(offset)
|
|
|
|
var cSize = C.long(len(*entityIDs))
|
2020-09-12 08:57:37 +00:00
|
|
|
var cEntityIdsPtr = (*C.long)(&(*entityIDs)[0])
|
2020-09-09 07:24:07 +00:00
|
|
|
var cTimestampsPtr = (*C.ulong)(&(*timestamps)[0])
|
2020-09-02 08:23:50 +00:00
|
|
|
|
2020-11-09 08:27:11 +00:00
|
|
|
var status = C.Delete(s.segmentPtr, cOffset, cSize, cEntityIdsPtr, cTimestampsPtr)
|
2020-09-02 09:18:49 +00:00
|
|
|
|
2020-11-26 08:01:31 +00:00
|
|
|
errorCode := status.error_code
|
|
|
|
|
|
|
|
if errorCode != 0 {
|
|
|
|
errorMsg := C.GoString(status.error_msg)
|
|
|
|
defer C.free(unsafe.Pointer(status.error_msg))
|
|
|
|
return errors.New("Delete failed, C runtime error detected, error code = " + strconv.Itoa(int(errorCode)) + ", error msg = " + errorMsg)
|
2020-09-02 09:18:49 +00:00
|
|
|
}
|
2020-09-02 08:23:50 +00:00
|
|
|
|
2020-09-07 09:01:46 +00:00
|
|
|
return nil
|
2020-08-28 09:29:26 +00:00
|
|
|
}
|
|
|
|
|
2020-11-19 06:13:39 +00:00
|
|
|
func (s *Segment) segmentSearch(plan *Plan,
|
|
|
|
placeHolderGroups []*PlaceholderGroup,
|
2020-11-26 08:01:31 +00:00
|
|
|
timestamp []Timestamp) (*SearchResult, error) {
|
2020-11-09 08:27:11 +00:00
|
|
|
/*
|
2020-11-26 08:01:31 +00:00
|
|
|
CStatus
|
|
|
|
Search(void* plan,
|
2020-11-19 06:13:39 +00:00
|
|
|
void* placeholder_groups,
|
|
|
|
uint64_t* timestamps,
|
|
|
|
int num_groups,
|
|
|
|
long int* result_ids,
|
|
|
|
float* result_distances);
|
2020-11-09 08:27:11 +00:00
|
|
|
*/
|
|
|
|
|
2020-11-17 02:07:42 +00:00
|
|
|
cPlaceholderGroups := make([]C.CPlaceholderGroup, 0)
|
|
|
|
for _, pg := range placeHolderGroups {
|
|
|
|
cPlaceholderGroups = append(cPlaceholderGroups, (*pg).cPlaceholderGroup)
|
2020-09-17 17:53:18 +00:00
|
|
|
}
|
2020-09-02 08:23:50 +00:00
|
|
|
|
2020-11-26 08:01:31 +00:00
|
|
|
var searchResult SearchResult
|
2020-11-17 02:07:42 +00:00
|
|
|
var cTimestamp = (*C.ulong)(×tamp[0])
|
|
|
|
var cPlaceHolder = (*C.CPlaceholderGroup)(&cPlaceholderGroups[0])
|
|
|
|
var cNumGroups = C.int(len(placeHolderGroups))
|
2020-12-03 11:00:11 +00:00
|
|
|
var cQueryResult = (*C.CQueryResult)(&searchResult.cQueryResult)
|
2020-09-02 08:23:50 +00:00
|
|
|
|
2020-11-26 08:01:31 +00:00
|
|
|
var status = C.Search(s.segmentPtr, plan.cPlan, cPlaceHolder, cTimestamp, cNumGroups, cQueryResult)
|
|
|
|
errorCode := status.error_code
|
2020-11-26 06:29:01 +00:00
|
|
|
|
2020-11-26 08:01:31 +00:00
|
|
|
if errorCode != 0 {
|
|
|
|
errorMsg := C.GoString(status.error_msg)
|
|
|
|
defer C.free(unsafe.Pointer(status.error_msg))
|
|
|
|
return nil, errors.New("Search failed, C runtime error detected, error code = " + strconv.Itoa(int(errorCode)) + ", error msg = " + errorMsg)
|
2020-11-26 07:18:36 +00:00
|
|
|
}
|
2020-11-26 08:01:31 +00:00
|
|
|
|
|
|
|
return &searchResult, nil
|
2020-08-28 09:29:26 +00:00
|
|
|
}
|
2020-12-03 11:00:11 +00:00
|
|
|
|
|
|
|
func (s *Segment) fillTargetEntry(plan *Plan,
|
|
|
|
result *SearchResult) error {
|
|
|
|
|
|
|
|
var status = C.FillTargetEntry(s.segmentPtr, plan.cPlan, result.cQueryResult)
|
|
|
|
errorCode := status.error_code
|
|
|
|
|
|
|
|
if errorCode != 0 {
|
|
|
|
errorMsg := C.GoString(status.error_msg)
|
|
|
|
defer C.free(unsafe.Pointer(status.error_msg))
|
|
|
|
return errors.New("FillTargetEntry failed, C runtime error detected, error code = " + strconv.Itoa(int(errorCode)) + ", error msg = " + errorMsg)
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
2020-12-24 12:55:40 +00:00
|
|
|
|
|
|
|
// segment, err := loadIndexService.replica.getSegmentByID(segmentID)
|
|
|
|
func (s *Segment) updateSegmentIndex(loadIndexInfo *LoadIndexInfo) error {
|
|
|
|
status := C.UpdateSegmentIndex(s.segmentPtr, loadIndexInfo.cLoadIndexInfo)
|
|
|
|
errorCode := status.error_code
|
|
|
|
|
|
|
|
if errorCode != 0 {
|
|
|
|
errorMsg := C.GoString(status.error_msg)
|
|
|
|
defer C.free(unsafe.Pointer(status.error_msg))
|
|
|
|
return errors.New("updateSegmentIndex failed, C runtime error detected, error code = " + strconv.Itoa(int(errorCode)) + ", error msg = " + errorMsg)
|
|
|
|
}
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|
2021-01-12 10:03:24 +00:00
|
|
|
|
|
|
|
func (s *Segment) setIndexParam(fieldID int64, indexParamKv []*commonpb.KeyValuePair) error {
|
|
|
|
s.paramMutex.Lock()
|
|
|
|
defer s.paramMutex.Unlock()
|
|
|
|
indexParamMap := make(indexParam)
|
|
|
|
if indexParamKv == nil {
|
|
|
|
return errors.New("loadIndexMsg's indexParam empty")
|
|
|
|
}
|
|
|
|
for _, param := range indexParamKv {
|
|
|
|
indexParamMap[param.Key] = param.Value
|
|
|
|
}
|
|
|
|
s.indexParam[fieldID] = indexParamMap
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (s *Segment) matchIndexParam(fieldID int64, indexParamKv []*commonpb.KeyValuePair) bool {
|
|
|
|
s.paramMutex.RLock()
|
|
|
|
defer s.paramMutex.RUnlock()
|
|
|
|
fieldIndexParam := s.indexParam[fieldID]
|
|
|
|
if fieldIndexParam == nil {
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
paramSize := len(s.indexParam)
|
|
|
|
matchCount := 0
|
|
|
|
for _, param := range indexParamKv {
|
|
|
|
value, ok := fieldIndexParam[param.Key]
|
|
|
|
if !ok {
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
if param.Value != value {
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
matchCount++
|
|
|
|
}
|
|
|
|
return paramSize == matchCount
|
|
|
|
}
|