enhance: Remove multiple vector field limit (#27827)

issue: https://github.com/milvus-io/milvus/issues/25639

/kind improvement
Signed-off-by: xige-16 <xi.ge@zilliz.com>

Signed-off-by: xige-16 <xi.ge@zilliz.com>
pull/29569/head
xige-16 2023-12-28 16:40:46 +08:00 committed by GitHub
parent 497ced9588
commit 0a70e8b601
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
13 changed files with 283 additions and 64 deletions

View File

@ -193,6 +193,7 @@ proxy:
# As of today (2.2.0 and after) it is strongly DISCOURAGED to set maxFieldNum >= 64. # As of today (2.2.0 and after) it is strongly DISCOURAGED to set maxFieldNum >= 64.
# So adjust at your risk! # So adjust at your risk!
maxFieldNum: 64 maxFieldNum: 64
maxVectorFieldNum: 4 # Maximum number of vector fields in a collection, (0, 10].
maxShardNum: 16 # Maximum number of shards in a collection maxShardNum: 16 # Maximum number of shards in a collection
maxDimension: 32768 # Maximum dimension of a vector maxDimension: 32768 # Maximum dimension of a vector
# Whether to produce gin logs.\n # Whether to produce gin logs.\n

View File

@ -268,6 +268,9 @@ func (coord *DataCoordMock) DropIndex(ctx context.Context, req *indexpb.DropInde
} }
func (coord *DataCoordMock) GetIndexState(ctx context.Context, req *indexpb.GetIndexStateRequest, opts ...grpc.CallOption) (*indexpb.GetIndexStateResponse, error) { func (coord *DataCoordMock) GetIndexState(ctx context.Context, req *indexpb.GetIndexStateRequest, opts ...grpc.CallOption) (*indexpb.GetIndexStateResponse, error) {
if coord.GetIndexStateFunc != nil {
return coord.GetIndexStateFunc(ctx, req, opts...)
}
return &indexpb.GetIndexStateResponse{ return &indexpb.GetIndexStateResponse{
Status: merr.Success(), Status: merr.Success(),
State: commonpb.IndexState_Finished, State: commonpb.IndexState_Finished,
@ -291,6 +294,9 @@ func (coord *DataCoordMock) GetIndexInfos(ctx context.Context, req *indexpb.GetI
// DescribeIndex describe the index info of the collection. // DescribeIndex describe the index info of the collection.
func (coord *DataCoordMock) DescribeIndex(ctx context.Context, req *indexpb.DescribeIndexRequest, opts ...grpc.CallOption) (*indexpb.DescribeIndexResponse, error) { func (coord *DataCoordMock) DescribeIndex(ctx context.Context, req *indexpb.DescribeIndexRequest, opts ...grpc.CallOption) (*indexpb.DescribeIndexResponse, error) {
if coord.DescribeIndexFunc != nil {
return coord.DescribeIndexFunc(ctx, req, opts...)
}
return &indexpb.DescribeIndexResponse{ return &indexpb.DescribeIndexResponse{
Status: merr.Success(), Status: merr.Success(),
IndexInfos: nil, IndexInfos: nil,

View File

@ -519,9 +519,11 @@ func TestProxy(t *testing.T) {
shardsNum := common.DefaultShardsNum shardsNum := common.DefaultShardsNum
int64Field := "int64" int64Field := "int64"
floatVecField := "fVec" floatVecField := "fVec"
binaryVecField := "bVec"
dim := 128 dim := 128
rowNum := 3000 rowNum := 3000
indexName := "_default" floatIndexName := "float_index"
binaryIndexName := "binary_index"
nlist := 10 nlist := 10
// nprobe := 10 // nprobe := 10
// topk := 10 // topk := 10
@ -558,6 +560,21 @@ func TestProxy(t *testing.T) {
IndexParams: nil, IndexParams: nil,
AutoID: false, AutoID: false,
} }
bVec := &schemapb.FieldSchema{
FieldID: 0,
Name: binaryVecField,
IsPrimaryKey: false,
Description: "",
DataType: schemapb.DataType_BinaryVector,
TypeParams: []*commonpb.KeyValuePair{
{
Key: common.DimKey,
Value: strconv.Itoa(dim),
},
},
IndexParams: nil,
AutoID: false,
}
return &schemapb.CollectionSchema{ return &schemapb.CollectionSchema{
Name: collectionName, Name: collectionName,
Description: "", Description: "",
@ -565,6 +582,7 @@ func TestProxy(t *testing.T) {
Fields: []*schemapb.FieldSchema{ Fields: []*schemapb.FieldSchema{
pk, pk,
fVec, fVec,
bVec,
}, },
} }
} }
@ -585,13 +603,14 @@ func TestProxy(t *testing.T) {
constructCollectionInsertRequest := func() *milvuspb.InsertRequest { constructCollectionInsertRequest := func() *milvuspb.InsertRequest {
fVecColumn := newFloatVectorFieldData(floatVecField, rowNum, dim) fVecColumn := newFloatVectorFieldData(floatVecField, rowNum, dim)
bVecColumn := newBinaryVectorFieldData(binaryVecField, rowNum, dim)
hashKeys := generateHashKeys(rowNum) hashKeys := generateHashKeys(rowNum)
return &milvuspb.InsertRequest{ return &milvuspb.InsertRequest{
Base: nil, Base: nil,
DbName: dbName, DbName: dbName,
CollectionName: collectionName, CollectionName: collectionName,
PartitionName: "", PartitionName: "",
FieldsData: []*schemapb.FieldData{fVecColumn}, FieldsData: []*schemapb.FieldData{fVecColumn, bVecColumn},
HashKeys: hashKeys, HashKeys: hashKeys,
NumRows: uint32(rowNum), NumRows: uint32(rowNum),
} }
@ -599,13 +618,14 @@ func TestProxy(t *testing.T) {
constructPartitionInsertRequest := func() *milvuspb.InsertRequest { constructPartitionInsertRequest := func() *milvuspb.InsertRequest {
fVecColumn := newFloatVectorFieldData(floatVecField, rowNum, dim) fVecColumn := newFloatVectorFieldData(floatVecField, rowNum, dim)
bVecColumn := newBinaryVectorFieldData(binaryVecField, rowNum, dim)
hashKeys := generateHashKeys(rowNum) hashKeys := generateHashKeys(rowNum)
return &milvuspb.InsertRequest{ return &milvuspb.InsertRequest{
Base: nil, Base: nil,
DbName: dbName, DbName: dbName,
CollectionName: collectionName, CollectionName: collectionName,
PartitionName: partitionName, PartitionName: partitionName,
FieldsData: []*schemapb.FieldData{fVecColumn}, FieldsData: []*schemapb.FieldData{fVecColumn, bVecColumn},
HashKeys: hashKeys, HashKeys: hashKeys,
NumRows: uint32(rowNum), NumRows: uint32(rowNum),
} }
@ -613,44 +633,75 @@ func TestProxy(t *testing.T) {
constructCollectionUpsertRequest := func() *milvuspb.UpsertRequest { constructCollectionUpsertRequest := func() *milvuspb.UpsertRequest {
fVecColumn := newFloatVectorFieldData(floatVecField, rowNum, dim) fVecColumn := newFloatVectorFieldData(floatVecField, rowNum, dim)
bVecColumn := newBinaryVectorFieldData(binaryVecField, rowNum, dim)
hashKeys := generateHashKeys(rowNum) hashKeys := generateHashKeys(rowNum)
return &milvuspb.UpsertRequest{ return &milvuspb.UpsertRequest{
Base: nil, Base: nil,
DbName: dbName, DbName: dbName,
CollectionName: collectionName, CollectionName: collectionName,
PartitionName: partitionName, PartitionName: partitionName,
FieldsData: []*schemapb.FieldData{fVecColumn}, FieldsData: []*schemapb.FieldData{fVecColumn, bVecColumn},
HashKeys: hashKeys, HashKeys: hashKeys,
NumRows: uint32(rowNum), NumRows: uint32(rowNum),
} }
} }
constructCreateIndexRequest := func() *milvuspb.CreateIndexRequest { constructCreateIndexRequest := func(dataType schemapb.DataType) *milvuspb.CreateIndexRequest {
return &milvuspb.CreateIndexRequest{ req := &milvuspb.CreateIndexRequest{
Base: nil, Base: nil,
DbName: dbName, DbName: dbName,
CollectionName: collectionName, CollectionName: collectionName,
FieldName: floatVecField,
IndexName: indexName,
ExtraParams: []*commonpb.KeyValuePair{
{
Key: common.DimKey,
Value: strconv.Itoa(dim),
},
{
Key: common.MetricTypeKey,
Value: metric.L2,
},
{
Key: common.IndexTypeKey,
Value: "IVF_FLAT",
},
{
Key: "nlist",
Value: strconv.Itoa(nlist),
},
},
} }
switch dataType {
case schemapb.DataType_FloatVector:
{
req.FieldName = floatVecField
req.IndexName = floatIndexName
req.ExtraParams = []*commonpb.KeyValuePair{
{
Key: common.DimKey,
Value: strconv.Itoa(dim),
},
{
Key: common.MetricTypeKey,
Value: metric.L2,
},
{
Key: common.IndexTypeKey,
Value: "IVF_FLAT",
},
{
Key: "nlist",
Value: strconv.Itoa(nlist),
},
}
}
case schemapb.DataType_BinaryVector:
{
req.FieldName = binaryVecField
req.IndexName = binaryIndexName
req.ExtraParams = []*commonpb.KeyValuePair{
{
Key: common.DimKey,
Value: strconv.Itoa(dim),
},
{
Key: common.MetricTypeKey,
Value: metric.JACCARD,
},
{
Key: common.IndexTypeKey,
Value: "BIN_IVF_FLAT",
},
{
Key: "nlist",
Value: strconv.Itoa(nlist),
},
}
}
}
return req
} }
wg.Add(1) wg.Add(1)
@ -1098,9 +1149,9 @@ func TestProxy(t *testing.T) {
}) })
wg.Add(1) wg.Add(1)
t.Run("create index", func(t *testing.T) { t.Run("create index for floatVec field", func(t *testing.T) {
defer wg.Done() defer wg.Done()
req := constructCreateIndexRequest() req := constructCreateIndexRequest(schemapb.DataType_FloatVector)
resp, err := proxy.CreateIndex(ctx, req) resp, err := proxy.CreateIndex(ctx, req)
assert.NoError(t, err) assert.NoError(t, err)
@ -1113,7 +1164,7 @@ func TestProxy(t *testing.T) {
req := &milvuspb.AlterIndexRequest{ req := &milvuspb.AlterIndexRequest{
DbName: dbName, DbName: dbName,
CollectionName: collectionName, CollectionName: collectionName,
IndexName: indexName, IndexName: floatIndexName,
ExtraParams: []*commonpb.KeyValuePair{ ExtraParams: []*commonpb.KeyValuePair{
{ {
Key: common.MmapEnabledKey, Key: common.MmapEnabledKey,
@ -1139,14 +1190,14 @@ func TestProxy(t *testing.T) {
}) })
err = merr.CheckRPCCall(resp, err) err = merr.CheckRPCCall(resp, err)
assert.NoError(t, err) assert.NoError(t, err)
assert.Equal(t, indexName, resp.IndexDescriptions[0].IndexName) assert.Equal(t, floatIndexName, resp.IndexDescriptions[0].IndexName)
assert.True(t, common.IsMmapEnabled(resp.IndexDescriptions[0].GetParams()...), "params: %+v", resp.IndexDescriptions[0]) assert.True(t, common.IsMmapEnabled(resp.IndexDescriptions[0].GetParams()...), "params: %+v", resp.IndexDescriptions[0])
// disable mmap then the tests below could continue // disable mmap then the tests below could continue
req := &milvuspb.AlterIndexRequest{ req := &milvuspb.AlterIndexRequest{
DbName: dbName, DbName: dbName,
CollectionName: collectionName, CollectionName: collectionName,
IndexName: indexName, IndexName: floatIndexName,
ExtraParams: []*commonpb.KeyValuePair{ ExtraParams: []*commonpb.KeyValuePair{
{ {
Key: common.MmapEnabledKey, Key: common.MmapEnabledKey,
@ -1170,7 +1221,7 @@ func TestProxy(t *testing.T) {
}) })
assert.NoError(t, err) assert.NoError(t, err)
assert.Equal(t, commonpb.ErrorCode_Success, resp.GetStatus().GetErrorCode()) assert.Equal(t, commonpb.ErrorCode_Success, resp.GetStatus().GetErrorCode())
indexName = resp.IndexDescriptions[0].IndexName assert.Equal(t, floatIndexName, resp.IndexDescriptions[0].IndexName)
}) })
wg.Add(1) wg.Add(1)
@ -1181,7 +1232,7 @@ func TestProxy(t *testing.T) {
DbName: dbName, DbName: dbName,
CollectionName: collectionName, CollectionName: collectionName,
FieldName: floatVecField, FieldName: floatVecField,
IndexName: indexName, IndexName: floatIndexName,
}) })
assert.NoError(t, err) assert.NoError(t, err)
assert.Equal(t, commonpb.ErrorCode_Success, resp.GetStatus().GetErrorCode()) assert.Equal(t, commonpb.ErrorCode_Success, resp.GetStatus().GetErrorCode())
@ -1195,12 +1246,44 @@ func TestProxy(t *testing.T) {
DbName: dbName, DbName: dbName,
CollectionName: collectionName, CollectionName: collectionName,
FieldName: floatVecField, FieldName: floatVecField,
IndexName: indexName, IndexName: floatIndexName,
}) })
assert.NoError(t, err) assert.NoError(t, err)
assert.Equal(t, commonpb.ErrorCode_Success, resp.GetStatus().GetErrorCode()) assert.Equal(t, commonpb.ErrorCode_Success, resp.GetStatus().GetErrorCode())
}) })
wg.Add(1)
t.Run("load collection not all vecFields with index", func(t *testing.T) {
defer wg.Done()
{
stateResp, err := proxy.GetLoadState(ctx, &milvuspb.GetLoadStateRequest{
DbName: dbName,
CollectionName: collectionName,
})
assert.NoError(t, err)
assert.Equal(t, commonpb.ErrorCode_Success, stateResp.GetStatus().GetErrorCode())
assert.Equal(t, commonpb.LoadState_LoadStateNotLoad, stateResp.State)
}
resp, err := proxy.LoadCollection(ctx, &milvuspb.LoadCollectionRequest{
Base: nil,
DbName: dbName,
CollectionName: collectionName,
})
assert.NoError(t, err)
assert.NotEqual(t, commonpb.ErrorCode_Success, resp.GetErrorCode())
})
wg.Add(1)
t.Run("create index for binVec field", func(t *testing.T) {
defer wg.Done()
req := constructCreateIndexRequest(schemapb.DataType_BinaryVector)
resp, err := proxy.CreateIndex(ctx, req)
assert.NoError(t, err)
assert.Equal(t, commonpb.ErrorCode_Success, resp.ErrorCode)
})
loaded := true loaded := true
wg.Add(1) wg.Add(1)
t.Run("load collection", func(t *testing.T) { t.Run("load collection", func(t *testing.T) {
@ -2198,7 +2281,7 @@ func TestProxy(t *testing.T) {
DbName: dbName, DbName: dbName,
CollectionName: collectionName, CollectionName: collectionName,
FieldName: floatVecField, FieldName: floatVecField,
IndexName: indexName, IndexName: floatIndexName,
}) })
assert.NoError(t, err) assert.NoError(t, err)
assert.Equal(t, commonpb.ErrorCode_Success, resp.ErrorCode) assert.Equal(t, commonpb.ErrorCode_Success, resp.ErrorCode)
@ -3448,6 +3531,21 @@ func TestProxy(t *testing.T) {
IndexParams: nil, IndexParams: nil,
AutoID: false, AutoID: false,
} }
bVec := &schemapb.FieldSchema{
FieldID: 0,
Name: binaryVecField,
IsPrimaryKey: false,
Description: "",
DataType: schemapb.DataType_BinaryVector,
TypeParams: []*commonpb.KeyValuePair{
{
Key: common.DimKey,
Value: strconv.Itoa(dim),
},
},
IndexParams: nil,
AutoID: false,
}
return &schemapb.CollectionSchema{ return &schemapb.CollectionSchema{
Name: collectionName, Name: collectionName,
Description: "", Description: "",
@ -3455,6 +3553,7 @@ func TestProxy(t *testing.T) {
Fields: []*schemapb.FieldSchema{ Fields: []*schemapb.FieldSchema{
pk, pk,
fVec, fVec,
bVec,
}, },
} }
} }
@ -3476,13 +3575,14 @@ func TestProxy(t *testing.T) {
constructPartitionReqUpsertRequestValid := func() *milvuspb.UpsertRequest { constructPartitionReqUpsertRequestValid := func() *milvuspb.UpsertRequest {
pkFieldData := newScalarFieldData(schema.Fields[0], int64Field, rowNum) pkFieldData := newScalarFieldData(schema.Fields[0], int64Field, rowNum)
fVecColumn := newFloatVectorFieldData(floatVecField, rowNum, dim) fVecColumn := newFloatVectorFieldData(floatVecField, rowNum, dim)
bVecColumn := newBinaryVectorFieldData(binaryVecField, rowNum, dim)
hashKeys := generateHashKeys(rowNum) hashKeys := generateHashKeys(rowNum)
return &milvuspb.UpsertRequest{ return &milvuspb.UpsertRequest{
Base: nil, Base: nil,
DbName: dbName, DbName: dbName,
CollectionName: collectionName, CollectionName: collectionName,
PartitionName: partitionName, PartitionName: partitionName,
FieldsData: []*schemapb.FieldData{pkFieldData, fVecColumn}, FieldsData: []*schemapb.FieldData{pkFieldData, fVecColumn, bVecColumn},
HashKeys: hashKeys, HashKeys: hashKeys,
NumRows: uint32(rowNum), NumRows: uint32(rowNum),
} }
@ -3491,13 +3591,14 @@ func TestProxy(t *testing.T) {
constructPartitionReqUpsertRequestInvalid := func() *milvuspb.UpsertRequest { constructPartitionReqUpsertRequestInvalid := func() *milvuspb.UpsertRequest {
pkFieldData := newScalarFieldData(schema.Fields[0], int64Field, rowNum) pkFieldData := newScalarFieldData(schema.Fields[0], int64Field, rowNum)
fVecColumn := newFloatVectorFieldData(floatVecField, rowNum, dim) fVecColumn := newFloatVectorFieldData(floatVecField, rowNum, dim)
bVecColumn := newBinaryVectorFieldData(binaryVecField, rowNum, dim)
hashKeys := generateHashKeys(rowNum) hashKeys := generateHashKeys(rowNum)
return &milvuspb.UpsertRequest{ return &milvuspb.UpsertRequest{
Base: nil, Base: nil,
DbName: dbName, DbName: dbName,
CollectionName: collectionName, CollectionName: collectionName,
PartitionName: "%$@", PartitionName: "%$@",
FieldsData: []*schemapb.FieldData{pkFieldData, fVecColumn}, FieldsData: []*schemapb.FieldData{pkFieldData, fVecColumn, bVecColumn},
HashKeys: hashKeys, HashKeys: hashKeys,
NumRows: uint32(rowNum), NumRows: uint32(rowNum),
} }
@ -3506,13 +3607,14 @@ func TestProxy(t *testing.T) {
constructCollectionUpsertRequestValid := func() *milvuspb.UpsertRequest { constructCollectionUpsertRequestValid := func() *milvuspb.UpsertRequest {
pkFieldData := newScalarFieldData(schema.Fields[0], int64Field, rowNum) pkFieldData := newScalarFieldData(schema.Fields[0], int64Field, rowNum)
fVecColumn := newFloatVectorFieldData(floatVecField, rowNum, dim) fVecColumn := newFloatVectorFieldData(floatVecField, rowNum, dim)
bVecColumn := newBinaryVectorFieldData(binaryVecField, rowNum, dim)
hashKeys := generateHashKeys(rowNum) hashKeys := generateHashKeys(rowNum)
return &milvuspb.UpsertRequest{ return &milvuspb.UpsertRequest{
Base: nil, Base: nil,
DbName: dbName, DbName: dbName,
CollectionName: collectionName, CollectionName: collectionName,
PartitionName: partitionName, PartitionName: partitionName,
FieldsData: []*schemapb.FieldData{pkFieldData, fVecColumn}, FieldsData: []*schemapb.FieldData{pkFieldData, fVecColumn, bVecColumn},
HashKeys: hashKeys, HashKeys: hashKeys,
NumRows: uint32(rowNum), NumRows: uint32(rowNum),
} }

View File

@ -226,6 +226,10 @@ func (t *createCollectionTask) PreExecute(ctx context.Context) error {
return fmt.Errorf("maximum field's number should be limited to %d", Params.ProxyCfg.MaxFieldNum.GetAsInt()) return fmt.Errorf("maximum field's number should be limited to %d", Params.ProxyCfg.MaxFieldNum.GetAsInt())
} }
if len(typeutil.GetVectorFieldSchemas(t.schema)) > Params.ProxyCfg.MaxVectorFieldNum.GetAsInt() {
return fmt.Errorf("maximum vector field's number should be limited to %d", Params.ProxyCfg.MaxVectorFieldNum.GetAsInt())
}
// validate collection name // validate collection name
if err := validateCollectionName(t.schema.Name); err != nil { if err := validateCollectionName(t.schema.Name); err != nil {
return err return err
@ -1456,19 +1460,24 @@ func (t *loadCollectionTask) Execute(ctx context.Context) (err error) {
return err return err
} }
hasVecIndex := false // not support multiple indexes on one field
fieldIndexIDs := make(map[int64]int64) fieldIndexIDs := make(map[int64]int64)
for _, index := range indexResponse.IndexInfos { for _, index := range indexResponse.IndexInfos {
fieldIndexIDs[index.FieldID] = index.IndexID fieldIndexIDs[index.FieldID] = index.IndexID
for _, field := range collSchema.Fields { }
if index.FieldID == field.FieldID && (field.DataType == schemapb.DataType_FloatVector || field.DataType == schemapb.DataType_BinaryVector || field.DataType == schemapb.DataType_Float16Vector) {
hasVecIndex = true unindexedVecFields := make([]string, 0)
for _, field := range collSchema.GetFields() {
if isVectorType(field.GetDataType()) {
if _, ok := fieldIndexIDs[field.GetFieldID()]; !ok {
unindexedVecFields = append(unindexedVecFields, field.GetName())
} }
} }
} }
if !hasVecIndex {
errMsg := fmt.Sprintf("there is no vector index on collection: %s, please create index firstly", t.LoadCollectionRequest.CollectionName) if len(unindexedVecFields) != 0 {
log.Error(errMsg) errMsg := fmt.Sprintf("there is no vector index on field: %v, please create index firstly", unindexedVecFields)
log.Debug(errMsg)
return errors.New(errMsg) return errors.New(errMsg)
} }
request := &querypb.LoadCollectionRequest{ request := &querypb.LoadCollectionRequest{

View File

@ -294,14 +294,16 @@ func (t *searchTask) PreExecute(ctx context.Context) error {
if t.request.GetDslType() == commonpb.DslType_BoolExprV1 { if t.request.GetDslType() == commonpb.DslType_BoolExprV1 {
annsField, err := funcutil.GetAttrByKeyFromRepeatedKV(AnnsFieldKey, t.request.GetSearchParams()) annsField, err := funcutil.GetAttrByKeyFromRepeatedKV(AnnsFieldKey, t.request.GetSearchParams())
if err != nil || len(annsField) == 0 { if err != nil || len(annsField) == 0 {
if enableMultipleVectorFields { vecFields := typeutil.GetVectorFieldSchemas(t.schema)
return errors.New(AnnsFieldKey + " not found in search_params") if len(vecFields) == 0 {
}
vecFieldSchema, err2 := typeutil.GetVectorFieldSchema(t.schema)
if err2 != nil {
return errors.New(AnnsFieldKey + " not found in schema") return errors.New(AnnsFieldKey + " not found in schema")
} }
annsField = vecFieldSchema.Name
if enableMultipleVectorFields && len(vecFields) > 1 {
return errors.New("multiple anns_fields exist, please specify a anns_field in search_params")
}
annsField = vecFields[0].Name
} }
queryInfo, offset, err := parseSearchInfo(t.request.GetSearchParams()) queryInfo, offset, err := parseSearchInfo(t.request.GetSearchParams())
if err != nil { if err != nil {

View File

@ -1700,6 +1700,7 @@ func TestSearchTask_ErrExecute(t *testing.T) {
}, },
CollectionName: collectionName, CollectionName: collectionName,
Nq: 2, Nq: 2,
DslType: commonpb.DslType_BoolExprV1,
}, },
qc: qc, qc: qc,
lb: lb, lb: lb,
@ -1711,7 +1712,13 @@ func TestSearchTask_ErrExecute(t *testing.T) {
assert.NoError(t, task.OnEnqueue()) assert.NoError(t, task.OnEnqueue())
task.ctx = ctx task.ctx = ctx
assert.NoError(t, task.PreExecute(ctx)) if enableMultipleVectorFields {
err = task.PreExecute(ctx)
assert.Error(t, err)
assert.Equal(t, err.Error(), "multiple anns_fields exist, please specify a anns_field in search_params")
} else {
assert.NoError(t, task.PreExecute(ctx))
}
qn.EXPECT().Search(mock.Anything, mock.Anything).Return(nil, errors.New("mock error")) qn.EXPECT().Search(mock.Anything, mock.Anything).Return(nil, errors.New("mock error"))
assert.Error(t, task.Execute(ctx)) assert.Error(t, task.Execute(ctx))

View File

@ -682,10 +682,36 @@ func TestCreateCollectionTask(t *testing.T) {
err = task.PreExecute(ctx) err = task.PreExecute(ctx)
assert.Error(t, err) assert.Error(t, err)
// too many vector fields
schema = proto.Clone(schemaBackup).(*schemapb.CollectionSchema)
schema.Fields = append(schema.Fields, schema.Fields[0])
for i := 0; i < Params.ProxyCfg.MaxVectorFieldNum.GetAsInt(); i++ {
schema.Fields = append(schema.Fields, &schemapb.FieldSchema{
FieldID: 101,
Name: floatVecField + "_" + strconv.Itoa(i),
IsPrimaryKey: false,
Description: "",
DataType: schemapb.DataType_FloatVector,
TypeParams: []*commonpb.KeyValuePair{
{
Key: common.DimKey,
Value: strconv.Itoa(testVecDim),
},
},
IndexParams: nil,
AutoID: false,
})
}
tooManyVectorFieldsSchema, err := proto.Marshal(schema)
assert.NoError(t, err)
task.CreateCollectionRequest.Schema = tooManyVectorFieldsSchema
err = task.PreExecute(ctx)
assert.Error(t, err)
task.CreateCollectionRequest = reqBackup task.CreateCollectionRequest = reqBackup
// validateCollectionName // validateCollectionName
schema = proto.Clone(schemaBackup).(*schemapb.CollectionSchema)
schema.Name = " " // empty schema.Name = " " // empty
emptyNameSchema, err := proto.Marshal(schema) emptyNameSchema, err := proto.Marshal(schema)
assert.NoError(t, err) assert.NoError(t, err)
@ -2551,6 +2577,42 @@ func Test_loadCollectionTask_Execute(t *testing.T) {
err := lct.Execute(ctx) err := lct.Execute(ctx)
assert.Error(t, err) assert.Error(t, err)
}) })
t.Run("not all vector fields with index", func(t *testing.T) {
vecFields := make([]*schemapb.FieldSchema, 0)
for _, field := range newTestSchema().GetFields() {
if isVectorType(field.GetDataType()) {
vecFields = append(vecFields, field)
}
}
assert.GreaterOrEqual(t, len(vecFields), 2)
dc.DescribeIndexFunc = func(ctx context.Context, request *indexpb.DescribeIndexRequest, opts ...grpc.CallOption) (*indexpb.DescribeIndexResponse, error) {
return &indexpb.DescribeIndexResponse{
Status: merr.Success(),
IndexInfos: []*indexpb.IndexInfo{
{
CollectionID: collectionID,
FieldID: vecFields[0].FieldID,
IndexName: indexName,
IndexID: indexID,
TypeParams: nil,
IndexParams: nil,
IndexedRows: 1025,
TotalRows: 1025,
State: commonpb.IndexState_Finished,
IndexStateFailReason: "",
IsAutoIndex: false,
UserIndexParams: nil,
},
},
}, nil
}
err := lct.Execute(ctx)
assert.Error(t, err)
})
} }
func Test_loadPartitionTask_Execute(t *testing.T) { func Test_loadPartitionTask_Execute(t *testing.T) {

View File

@ -56,7 +56,7 @@ const (
boundedTS = 2 boundedTS = 2
// enableMultipleVectorFields indicates whether to enable multiple vector fields. // enableMultipleVectorFields indicates whether to enable multiple vector fields.
enableMultipleVectorFields = false enableMultipleVectorFields = true
defaultMaxVarCharLength = 65535 defaultMaxVarCharLength = 65535

View File

@ -952,6 +952,7 @@ type proxyConfig struct {
MinPasswordLength ParamItem `refreshable:"true"` MinPasswordLength ParamItem `refreshable:"true"`
MaxPasswordLength ParamItem `refreshable:"true"` MaxPasswordLength ParamItem `refreshable:"true"`
MaxFieldNum ParamItem `refreshable:"true"` MaxFieldNum ParamItem `refreshable:"true"`
MaxVectorFieldNum ParamItem `refreshable:"true"`
MaxShardNum ParamItem `refreshable:"true"` MaxShardNum ParamItem `refreshable:"true"`
MaxDimension ParamItem `refreshable:"true"` MaxDimension ParamItem `refreshable:"true"`
GinLogging ParamItem `refreshable:"false"` GinLogging ParamItem `refreshable:"false"`
@ -1047,6 +1048,22 @@ So adjust at your risk!`,
} }
p.MaxFieldNum.Init(base.mgr) p.MaxFieldNum.Init(base.mgr)
p.MaxVectorFieldNum = ParamItem{
Key: "proxy.maxVectorFieldNum",
Version: "2.4.0",
DefaultValue: "4",
Formatter: func(v string) string {
if getAsInt(v) > 10 {
return "10"
}
return v
},
PanicIfEmpty: true,
Doc: "Maximum number of vector fields in a collection.",
Export: true,
}
p.MaxVectorFieldNum.Init(base.mgr)
p.MaxShardNum = ParamItem{ p.MaxShardNum = ParamItem{
Key: "proxy.maxShardNum", Key: "proxy.maxShardNum",
DefaultValue: "16", DefaultValue: "16",

View File

@ -139,6 +139,8 @@ func TestComponentParam(t *testing.T) {
t.Logf("MaxFieldNum: %d", Params.MaxFieldNum.GetAsInt64()) t.Logf("MaxFieldNum: %d", Params.MaxFieldNum.GetAsInt64())
t.Logf("MaxVectorFieldNum: %d", Params.MaxVectorFieldNum.GetAsInt64())
t.Logf("MaxShardNum: %d", Params.MaxShardNum.GetAsInt64()) t.Logf("MaxShardNum: %d", Params.MaxShardNum.GetAsInt64())
t.Logf("MaxDimension: %d", Params.MaxDimension.GetAsInt64()) t.Logf("MaxDimension: %d", Params.MaxDimension.GetAsInt64())

View File

@ -782,6 +782,18 @@ func GetVectorFieldSchema(schema *schemapb.CollectionSchema) (*schemapb.FieldSch
return nil, errors.New("vector field is not found") return nil, errors.New("vector field is not found")
} }
// GetVectorFieldSchemas get vector fields schema from collection schema.
func GetVectorFieldSchemas(schema *schemapb.CollectionSchema) []*schemapb.FieldSchema {
ret := make([]*schemapb.FieldSchema, 0)
for _, fieldSchema := range schema.Fields {
if IsVectorType(fieldSchema.DataType) {
ret = append(ret, fieldSchema)
}
}
return ret
}
// GetPrimaryFieldSchema get primary field schema from collection schema // GetPrimaryFieldSchema get primary field schema from collection schema
func GetPrimaryFieldSchema(schema *schemapb.CollectionSchema) (*schemapb.FieldSchema, error) { func GetPrimaryFieldSchema(schema *schemapb.CollectionSchema) (*schemapb.FieldSchema, error) {
for _, fieldSchema := range schema.Fields { for _, fieldSchema := range schema.Fields {

View File

@ -456,7 +456,7 @@ class TestCollectionParams(TestcaseBase):
""" """
target: test collection with multi float vectors target: test collection with multi float vectors
method: create collection with two float-vec fields method: create collection with two float-vec fields
expected: raise exception (not supported yet) expected: Collection created successfully
""" """
# 1. connect # 1. connect
self._connect() self._connect()
@ -465,25 +465,24 @@ class TestCollectionParams(TestcaseBase):
fields = [cf.gen_int64_field(is_primary=True), cf.gen_float_field(), fields = [cf.gen_int64_field(is_primary=True), cf.gen_float_field(),
cf.gen_float_vec_field(dim=default_dim), cf.gen_float_vec_field(name="tmp", dim=default_dim)] cf.gen_float_vec_field(dim=default_dim), cf.gen_float_vec_field(name="tmp", dim=default_dim)]
schema = cf.gen_collection_schema(fields=fields) schema = cf.gen_collection_schema(fields=fields)
err_msg = "multiple vector fields is not supported"
self.collection_wrap.init_collection(c_name, schema=schema, self.collection_wrap.init_collection(c_name, schema=schema,
check_task=CheckTasks.err_res, check_task=CheckTasks.check_collection_property,
check_items={"err_code": 1, "err_msg": err_msg}) check_items={exp_name: c_name, exp_schema: schema})
@pytest.mark.tags(CaseLabel.L1) @pytest.mark.tags(CaseLabel.L1)
def test_collection_mix_vectors(self): def test_collection_mix_vectors(self):
""" """
target: test collection with mix vectors target: test collection with mix vectors
method: create with float and binary vec method: create with float and binary vec
expected: raise exception expected: Collection created successfully
""" """
self._connect() self._connect()
c_name = cf.gen_unique_str(prefix) c_name = cf.gen_unique_str(prefix)
fields = [cf.gen_int64_field(is_primary=True), cf.gen_float_vec_field(), cf.gen_binary_vec_field()] fields = [cf.gen_int64_field(is_primary=True), cf.gen_float_vec_field(), cf.gen_binary_vec_field()]
schema = cf.gen_collection_schema(fields=fields, auto_id=True) schema = cf.gen_collection_schema(fields=fields, auto_id=True)
err_msg = "multiple vector fields is not supported" self.collection_wrap.init_collection(c_name, schema=schema,
self.collection_wrap.init_collection(c_name, schema=schema, check_task=CheckTasks.err_res, check_task=CheckTasks.check_collection_property,
check_items={"err_code": 1, "err_msg": err_msg}) check_items={exp_name: c_name, exp_schema: schema})
@pytest.mark.tags(CaseLabel.L0) @pytest.mark.tags(CaseLabel.L0)
def test_collection_without_vectors(self): def test_collection_without_vectors(self):

View File

@ -244,8 +244,8 @@ class TestIndexOperation(TestcaseBase):
collection_w.create_index(ct.default_int64_field_name, {}) collection_w.create_index(ct.default_int64_field_name, {})
collection_w.load(check_task=CheckTasks.err_res, collection_w.load(check_task=CheckTasks.err_res,
check_items={ct.err_code: 65535, check_items={ct.err_code: 65535,
ct.err_msg: f"there is no vector index on collection: {collection_w.name}, " ct.err_msg: f"there is no vector index on field: [float_vector], "
f"please create index firstly"}) f"please create index firstly: collection={collection_w.name}: index not found"})
@pytest.mark.tags(CaseLabel.L2) @pytest.mark.tags(CaseLabel.L2)
def test_index_create_on_array_field(self): def test_index_create_on_array_field(self):