mirror of https://github.com/milvus-io/milvus.git
enhance: add `max insert request size` and `must use partition key` configs (#32433)
issue: https://github.com/milvus-io/milvus/issues/30577 /kind improvement Signed-off-by: SimFG <bang.fu@zilliz.com>pull/32450/head
parent
31a29a2451
commit
8594b55ad5
|
@ -2801,6 +2801,7 @@ func (node *Proxy) search(ctx context.Context, request *milvuspb.SearchRequest)
|
||||||
node: node,
|
node: node,
|
||||||
lb: node.lbPolicy,
|
lb: node.lbPolicy,
|
||||||
enableMaterializedView: node.enableMaterializedView,
|
enableMaterializedView: node.enableMaterializedView,
|
||||||
|
mustUsePartitionKey: Params.ProxyCfg.MustUsePartitionKey.GetAsBool(),
|
||||||
}
|
}
|
||||||
|
|
||||||
guaranteeTs := request.GuaranteeTimestamp
|
guaranteeTs := request.GuaranteeTimestamp
|
||||||
|
@ -3002,6 +3003,7 @@ func (node *Proxy) hybridSearch(ctx context.Context, request *milvuspb.HybridSea
|
||||||
qc: node.queryCoord,
|
qc: node.queryCoord,
|
||||||
node: node,
|
node: node,
|
||||||
lb: node.lbPolicy,
|
lb: node.lbPolicy,
|
||||||
|
mustUsePartitionKey: Params.ProxyCfg.MustUsePartitionKey.GetAsBool(),
|
||||||
}
|
}
|
||||||
|
|
||||||
guaranteeTs := request.GuaranteeTimestamp
|
guaranteeTs := request.GuaranteeTimestamp
|
||||||
|
@ -3414,6 +3416,7 @@ func (node *Proxy) Query(ctx context.Context, request *milvuspb.QueryRequest) (*
|
||||||
request: request,
|
request: request,
|
||||||
qc: node.queryCoord,
|
qc: node.queryCoord,
|
||||||
lb: node.lbPolicy,
|
lb: node.lbPolicy,
|
||||||
|
mustUsePartitionKey: Params.ProxyCfg.MustUsePartitionKey.GetAsBool(),
|
||||||
}
|
}
|
||||||
res, err := node.query(ctx, qt)
|
res, err := node.query(ctx, qt)
|
||||||
if merr.Ok(res.Status) && err == nil {
|
if merr.Ok(res.Status) && err == nil {
|
||||||
|
|
|
@ -1590,6 +1590,14 @@ func TestProxy(t *testing.T) {
|
||||||
resp, err := proxy.Search(ctx, req)
|
resp, err := proxy.Search(ctx, req)
|
||||||
assert.NoError(t, err)
|
assert.NoError(t, err)
|
||||||
assert.Equal(t, commonpb.ErrorCode_Success, resp.Status.ErrorCode)
|
assert.Equal(t, commonpb.ErrorCode_Success, resp.Status.ErrorCode)
|
||||||
|
|
||||||
|
{
|
||||||
|
Params.Save(Params.ProxyCfg.MustUsePartitionKey.Key, "true")
|
||||||
|
resp, err := proxy.Search(ctx, req)
|
||||||
|
assert.NoError(t, err)
|
||||||
|
assert.NotEqual(t, commonpb.ErrorCode_Success, resp.Status.ErrorCode)
|
||||||
|
Params.Reset(Params.ProxyCfg.MustUsePartitionKey.Key)
|
||||||
|
}
|
||||||
})
|
})
|
||||||
|
|
||||||
constructAdvancedSearchRequest := func() *milvuspb.SearchRequest {
|
constructAdvancedSearchRequest := func() *milvuspb.SearchRequest {
|
||||||
|
|
|
@ -212,6 +212,12 @@ func (t *createCollectionTask) validatePartitionKey() error {
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
mustPartitionKey := Params.ProxyCfg.MustUsePartitionKey.GetAsBool()
|
||||||
|
if mustPartitionKey && idx == -1 {
|
||||||
|
return merr.WrapErrParameterInvalidMsg("partition key must be set when creating the collection" +
|
||||||
|
" because the mustUsePartitionKey config is true")
|
||||||
|
}
|
||||||
|
|
||||||
if idx == -1 {
|
if idx == -1 {
|
||||||
if t.GetNumPartitions() != 0 {
|
if t.GetNumPartitions() != 0 {
|
||||||
return fmt.Errorf("num_partitions should only be specified with partition key field enabled")
|
return fmt.Errorf("num_partitions should only be specified with partition key field enabled")
|
||||||
|
|
|
@ -112,6 +112,13 @@ func (it *insertTask) PreExecute(ctx context.Context) error {
|
||||||
return err
|
return err
|
||||||
}
|
}
|
||||||
|
|
||||||
|
maxInsertSize := Params.QuotaConfig.MaxInsertSize.GetAsInt()
|
||||||
|
if maxInsertSize != -1 && it.insertMsg.Size() > maxInsertSize {
|
||||||
|
log.Warn("insert request size exceeds maxInsertSize",
|
||||||
|
zap.Int("request size", it.insertMsg.Size()), zap.Int("maxInsertSize", maxInsertSize))
|
||||||
|
return merr.WrapErrParameterTooLarge("insert request size exceeds maxInsertSize")
|
||||||
|
}
|
||||||
|
|
||||||
schema, err := globalMetaCache.GetCollectionSchema(ctx, it.insertMsg.GetDbName(), collectionName)
|
schema, err := globalMetaCache.GetCollectionSchema(ctx, it.insertMsg.GetDbName(), collectionName)
|
||||||
if err != nil {
|
if err != nil {
|
||||||
log.Warn("get collection schema from global meta cache failed", zap.String("collectionName", collectionName), zap.Error(err))
|
log.Warn("get collection schema from global meta cache failed", zap.String("collectionName", collectionName), zap.Error(err))
|
||||||
|
|
|
@ -11,6 +11,8 @@ import (
|
||||||
"github.com/milvus-io/milvus-proto/go-api/v2/msgpb"
|
"github.com/milvus-io/milvus-proto/go-api/v2/msgpb"
|
||||||
"github.com/milvus-io/milvus-proto/go-api/v2/schemapb"
|
"github.com/milvus-io/milvus-proto/go-api/v2/schemapb"
|
||||||
"github.com/milvus-io/milvus/pkg/mq/msgstream"
|
"github.com/milvus-io/milvus/pkg/mq/msgstream"
|
||||||
|
"github.com/milvus-io/milvus/pkg/util/merr"
|
||||||
|
"github.com/milvus-io/milvus/pkg/util/paramtable"
|
||||||
)
|
)
|
||||||
|
|
||||||
func TestInsertTask_CheckAligned(t *testing.T) {
|
func TestInsertTask_CheckAligned(t *testing.T) {
|
||||||
|
@ -285,3 +287,23 @@ func TestInsertTask(t *testing.T) {
|
||||||
assert.ElementsMatch(t, channels, it.pChannels)
|
assert.ElementsMatch(t, channels, it.pChannels)
|
||||||
})
|
})
|
||||||
}
|
}
|
||||||
|
|
||||||
|
func TestMaxInsertSize(t *testing.T) {
|
||||||
|
t.Run("test MaxInsertSize", func(t *testing.T) {
|
||||||
|
paramtable.Init()
|
||||||
|
Params.Save(Params.QuotaConfig.MaxInsertSize.Key, "1")
|
||||||
|
defer Params.Reset(Params.QuotaConfig.MaxInsertSize.Key)
|
||||||
|
it := insertTask{
|
||||||
|
ctx: context.Background(),
|
||||||
|
insertMsg: &msgstream.InsertMsg{
|
||||||
|
InsertRequest: msgpb.InsertRequest{
|
||||||
|
DbName: "hooooooo",
|
||||||
|
CollectionName: "fooooo",
|
||||||
|
},
|
||||||
|
},
|
||||||
|
}
|
||||||
|
err := it.PreExecute(context.Background())
|
||||||
|
assert.Error(t, err)
|
||||||
|
assert.ErrorIs(t, err, merr.ErrParameterTooLarge)
|
||||||
|
})
|
||||||
|
}
|
||||||
|
|
|
@ -68,6 +68,7 @@ type queryTask struct {
|
||||||
reQuery bool
|
reQuery bool
|
||||||
allQueryCnt int64
|
allQueryCnt int64
|
||||||
totalRelatedDataSize int64
|
totalRelatedDataSize int64
|
||||||
|
mustUsePartitionKey bool
|
||||||
}
|
}
|
||||||
|
|
||||||
type queryParams struct {
|
type queryParams struct {
|
||||||
|
@ -303,6 +304,10 @@ func (t *queryTask) PreExecute(ctx context.Context) error {
|
||||||
if t.partitionKeyMode && len(t.request.GetPartitionNames()) != 0 {
|
if t.partitionKeyMode && len(t.request.GetPartitionNames()) != 0 {
|
||||||
return errors.New("not support manually specifying the partition names if partition key mode is used")
|
return errors.New("not support manually specifying the partition names if partition key mode is used")
|
||||||
}
|
}
|
||||||
|
if t.mustUsePartitionKey && !t.partitionKeyMode {
|
||||||
|
return merr.WrapErrParameterInvalidMsg("must use partition key in the query request " +
|
||||||
|
"because the mustUsePartitionKey config is true")
|
||||||
|
}
|
||||||
|
|
||||||
for _, tag := range t.request.PartitionNames {
|
for _, tag := range t.request.PartitionNames {
|
||||||
if err := validatePartitionTag(tag, false); err != nil {
|
if err := validatePartitionTag(tag, false); err != nil {
|
||||||
|
|
|
@ -170,6 +170,15 @@ func TestQueryTask_all(t *testing.T) {
|
||||||
assert.Equal(t, typeutil.ZeroTimestamp, task.TimeoutTimestamp)
|
assert.Equal(t, typeutil.ZeroTimestamp, task.TimeoutTimestamp)
|
||||||
task.ctx = ctx1
|
task.ctx = ctx1
|
||||||
assert.NoError(t, task.PreExecute(ctx))
|
assert.NoError(t, task.PreExecute(ctx))
|
||||||
|
|
||||||
|
{
|
||||||
|
task.mustUsePartitionKey = true
|
||||||
|
err := task.PreExecute(ctx)
|
||||||
|
assert.Error(t, err)
|
||||||
|
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
|
||||||
|
task.mustUsePartitionKey = false
|
||||||
|
}
|
||||||
|
|
||||||
// after preExecute
|
// after preExecute
|
||||||
assert.Greater(t, task.TimeoutTimestamp, typeutil.ZeroTimestamp)
|
assert.Greater(t, task.TimeoutTimestamp, typeutil.ZeroTimestamp)
|
||||||
|
|
||||||
|
|
|
@ -61,6 +61,7 @@ type searchTask struct {
|
||||||
requery bool
|
requery bool
|
||||||
partitionKeyMode bool
|
partitionKeyMode bool
|
||||||
enableMaterializedView bool
|
enableMaterializedView bool
|
||||||
|
mustUsePartitionKey bool
|
||||||
|
|
||||||
userOutputFields []string
|
userOutputFields []string
|
||||||
|
|
||||||
|
@ -135,6 +136,10 @@ func (t *searchTask) PreExecute(ctx context.Context) error {
|
||||||
if t.partitionKeyMode && len(t.request.GetPartitionNames()) != 0 {
|
if t.partitionKeyMode && len(t.request.GetPartitionNames()) != 0 {
|
||||||
return errors.New("not support manually specifying the partition names if partition key mode is used")
|
return errors.New("not support manually specifying the partition names if partition key mode is used")
|
||||||
}
|
}
|
||||||
|
if t.mustUsePartitionKey && !t.partitionKeyMode {
|
||||||
|
return merr.WrapErrParameterInvalidMsg("must use partition key in the search request " +
|
||||||
|
"because the mustUsePartitionKey config is true")
|
||||||
|
}
|
||||||
|
|
||||||
if !t.partitionKeyMode && len(t.request.GetPartitionNames()) > 0 {
|
if !t.partitionKeyMode && len(t.request.GetPartitionNames()) > 0 {
|
||||||
// translate partition name to partition ids. Use regex-pattern to match partition name.
|
// translate partition name to partition ids. Use regex-pattern to match partition name.
|
||||||
|
|
|
@ -328,6 +328,14 @@ func TestSearchTask_PreExecute(t *testing.T) {
|
||||||
assert.NoError(t, task.PreExecute(ctx))
|
assert.NoError(t, task.PreExecute(ctx))
|
||||||
assert.Greater(t, task.TimeoutTimestamp, typeutil.ZeroTimestamp)
|
assert.Greater(t, task.TimeoutTimestamp, typeutil.ZeroTimestamp)
|
||||||
|
|
||||||
|
{
|
||||||
|
task.mustUsePartitionKey = true
|
||||||
|
err = task.PreExecute(ctx)
|
||||||
|
assert.Error(t, err)
|
||||||
|
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
|
||||||
|
task.mustUsePartitionKey = false
|
||||||
|
}
|
||||||
|
|
||||||
// field not exist
|
// field not exist
|
||||||
task.ctx = context.TODO()
|
task.ctx = context.TODO()
|
||||||
task.request.OutputFields = []string{testInt64Field + funcutil.GenRandomStr()}
|
task.request.OutputFields = []string{testInt64Field + funcutil.GenRandomStr()}
|
||||||
|
|
|
@ -696,6 +696,12 @@ func TestCreateCollectionTask(t *testing.T) {
|
||||||
err = task.PreExecute(ctx)
|
err = task.PreExecute(ctx)
|
||||||
assert.NoError(t, err)
|
assert.NoError(t, err)
|
||||||
|
|
||||||
|
Params.Save(Params.ProxyCfg.MustUsePartitionKey.Key, "true")
|
||||||
|
err = task.PreExecute(ctx)
|
||||||
|
assert.Error(t, err)
|
||||||
|
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
|
||||||
|
Params.Reset(Params.ProxyCfg.MustUsePartitionKey.Key)
|
||||||
|
|
||||||
task.Schema = []byte{0x1, 0x2, 0x3, 0x4}
|
task.Schema = []byte{0x1, 0x2, 0x3, 0x4}
|
||||||
err = task.PreExecute(ctx)
|
err = task.PreExecute(ctx)
|
||||||
assert.Error(t, err)
|
assert.Error(t, err)
|
||||||
|
|
|
@ -111,6 +111,7 @@ var (
|
||||||
// Parameter related
|
// Parameter related
|
||||||
ErrParameterInvalid = newMilvusError("invalid parameter", 1100, false)
|
ErrParameterInvalid = newMilvusError("invalid parameter", 1100, false)
|
||||||
ErrParameterMissing = newMilvusError("missing parameter", 1101, false)
|
ErrParameterMissing = newMilvusError("missing parameter", 1101, false)
|
||||||
|
ErrParameterTooLarge = newMilvusError("parameter too large", 1102, false)
|
||||||
|
|
||||||
// Metrics related
|
// Metrics related
|
||||||
ErrMetricNotFound = newMilvusError("metric not found", 1200, false)
|
ErrMetricNotFound = newMilvusError("metric not found", 1200, false)
|
||||||
|
|
|
@ -136,6 +136,7 @@ func (s *ErrSuite) TestWrap() {
|
||||||
s.ErrorIs(WrapErrParameterInvalid(8, 1, "failed to create"), ErrParameterInvalid)
|
s.ErrorIs(WrapErrParameterInvalid(8, 1, "failed to create"), ErrParameterInvalid)
|
||||||
s.ErrorIs(WrapErrParameterInvalidRange(1, 1<<16, 0, "topk should be in range"), ErrParameterInvalid)
|
s.ErrorIs(WrapErrParameterInvalidRange(1, 1<<16, 0, "topk should be in range"), ErrParameterInvalid)
|
||||||
s.ErrorIs(WrapErrParameterMissing("alias_name", "no alias parameter"), ErrParameterMissing)
|
s.ErrorIs(WrapErrParameterMissing("alias_name", "no alias parameter"), ErrParameterMissing)
|
||||||
|
s.ErrorIs(WrapErrParameterTooLarge("unit test"), ErrParameterTooLarge)
|
||||||
|
|
||||||
// Metrics related
|
// Metrics related
|
||||||
s.ErrorIs(WrapErrMetricNotFound("unknown", "failed to get metric"), ErrMetricNotFound)
|
s.ErrorIs(WrapErrMetricNotFound("unknown", "failed to get metric"), ErrMetricNotFound)
|
||||||
|
|
|
@ -863,6 +863,14 @@ func WrapErrParameterMissing[T any](param T, msg ...string) error {
|
||||||
return err
|
return err
|
||||||
}
|
}
|
||||||
|
|
||||||
|
func WrapErrParameterTooLarge(name string, msg ...string) error {
|
||||||
|
err := wrapFields(ErrParameterTooLarge, value("message", name))
|
||||||
|
if len(msg) > 0 {
|
||||||
|
err = errors.Wrap(err, strings.Join(msg, "->"))
|
||||||
|
}
|
||||||
|
return err
|
||||||
|
}
|
||||||
|
|
||||||
// Metrics related
|
// Metrics related
|
||||||
func WrapErrMetricNotFound(name string, msg ...string) error {
|
func WrapErrMetricNotFound(name string, msg ...string) error {
|
||||||
err := wrapFields(ErrMetricNotFound, value("metric", name))
|
err := wrapFields(ErrMetricNotFound, value("metric", name))
|
||||||
|
|
|
@ -1011,6 +1011,7 @@ type proxyConfig struct {
|
||||||
RetryTimesOnReplica ParamItem `refreshable:"true"`
|
RetryTimesOnReplica ParamItem `refreshable:"true"`
|
||||||
RetryTimesOnHealthCheck ParamItem `refreshable:"true"`
|
RetryTimesOnHealthCheck ParamItem `refreshable:"true"`
|
||||||
PartitionNameRegexp ParamItem `refreshable:"true"`
|
PartitionNameRegexp ParamItem `refreshable:"true"`
|
||||||
|
MustUsePartitionKey ParamItem `refreshable:"true"`
|
||||||
|
|
||||||
AccessLog AccessLogConfig
|
AccessLog AccessLogConfig
|
||||||
|
|
||||||
|
@ -1338,6 +1339,15 @@ please adjust in embedded Milvus: false`,
|
||||||
}
|
}
|
||||||
p.PartitionNameRegexp.Init(base.mgr)
|
p.PartitionNameRegexp.Init(base.mgr)
|
||||||
|
|
||||||
|
p.MustUsePartitionKey = ParamItem{
|
||||||
|
Key: "proxy.mustUsePartitionKey",
|
||||||
|
Version: "2.4.1",
|
||||||
|
DefaultValue: "false",
|
||||||
|
Doc: "switch for whether proxy must use partition key for the collection",
|
||||||
|
Export: true,
|
||||||
|
}
|
||||||
|
p.MustUsePartitionKey.Init(base.mgr)
|
||||||
|
|
||||||
p.GracefulStopTimeout = ParamItem{
|
p.GracefulStopTimeout = ParamItem{
|
||||||
Key: "proxy.gracefulStopTimeout",
|
Key: "proxy.gracefulStopTimeout",
|
||||||
Version: "2.3.7",
|
Version: "2.3.7",
|
||||||
|
|
|
@ -170,6 +170,10 @@ func TestComponentParam(t *testing.T) {
|
||||||
|
|
||||||
params.Save("proxy.gracefulStopTimeout", "100")
|
params.Save("proxy.gracefulStopTimeout", "100")
|
||||||
assert.Equal(t, 100*time.Second, Params.GracefulStopTimeout.GetAsDuration(time.Second))
|
assert.Equal(t, 100*time.Second, Params.GracefulStopTimeout.GetAsDuration(time.Second))
|
||||||
|
|
||||||
|
assert.False(t, Params.MustUsePartitionKey.GetAsBool())
|
||||||
|
params.Save("proxy.mustUsePartitionKey", "true")
|
||||||
|
assert.True(t, Params.MustUsePartitionKey.GetAsBool())
|
||||||
})
|
})
|
||||||
|
|
||||||
// t.Run("test proxyConfig panic", func(t *testing.T) {
|
// t.Run("test proxyConfig panic", func(t *testing.T) {
|
||||||
|
|
|
@ -128,6 +128,7 @@ type quotaConfig struct {
|
||||||
NQLimit ParamItem `refreshable:"true"`
|
NQLimit ParamItem `refreshable:"true"`
|
||||||
MaxQueryResultWindow ParamItem `refreshable:"true"`
|
MaxQueryResultWindow ParamItem `refreshable:"true"`
|
||||||
MaxOutputSize ParamItem `refreshable:"true"`
|
MaxOutputSize ParamItem `refreshable:"true"`
|
||||||
|
MaxInsertSize ParamItem `refreshable:"true"`
|
||||||
MaxResourceGroupNumOfQueryNode ParamItem `refreshable:"true"`
|
MaxResourceGroupNumOfQueryNode ParamItem `refreshable:"true"`
|
||||||
|
|
||||||
// limit writing
|
// limit writing
|
||||||
|
@ -1537,6 +1538,15 @@ Check https://milvus.io/docs/limitations.md for more details.`,
|
||||||
}
|
}
|
||||||
p.MaxOutputSize.Init(base.mgr)
|
p.MaxOutputSize.Init(base.mgr)
|
||||||
|
|
||||||
|
p.MaxInsertSize = ParamItem{
|
||||||
|
Key: "quotaAndLimits.limits.maxInsertSize",
|
||||||
|
Version: "2.4.1",
|
||||||
|
DefaultValue: "-1", // -1 means no limit, the unit is byte
|
||||||
|
Doc: `maximum size of a single insert request, in bytes, -1 means no limit`,
|
||||||
|
Export: true,
|
||||||
|
}
|
||||||
|
p.MaxInsertSize.Init(base.mgr)
|
||||||
|
|
||||||
p.MaxResourceGroupNumOfQueryNode = ParamItem{
|
p.MaxResourceGroupNumOfQueryNode = ParamItem{
|
||||||
Key: "quotaAndLimits.limits.maxResourceGroupNumOfQueryNode",
|
Key: "quotaAndLimits.limits.maxResourceGroupNumOfQueryNode",
|
||||||
Version: "2.4.1",
|
Version: "2.4.1",
|
||||||
|
|
|
@ -175,11 +175,16 @@ func TestQuotaParam(t *testing.T) {
|
||||||
})
|
})
|
||||||
|
|
||||||
t.Run("test limits", func(t *testing.T) {
|
t.Run("test limits", func(t *testing.T) {
|
||||||
|
params.Init(NewBaseTable(SkipRemote(true)))
|
||||||
assert.Equal(t, 65536, qc.MaxCollectionNum.GetAsInt())
|
assert.Equal(t, 65536, qc.MaxCollectionNum.GetAsInt())
|
||||||
assert.Equal(t, 65536, qc.MaxCollectionNumPerDB.GetAsInt())
|
assert.Equal(t, 65536, qc.MaxCollectionNumPerDB.GetAsInt())
|
||||||
assert.Equal(t, 1024, params.QuotaConfig.MaxResourceGroupNumOfQueryNode.GetAsInt())
|
assert.Equal(t, 1024, params.QuotaConfig.MaxResourceGroupNumOfQueryNode.GetAsInt())
|
||||||
params.Save(params.QuotaConfig.MaxResourceGroupNumOfQueryNode.Key, "512")
|
params.Save(params.QuotaConfig.MaxResourceGroupNumOfQueryNode.Key, "512")
|
||||||
assert.Equal(t, 512, params.QuotaConfig.MaxResourceGroupNumOfQueryNode.GetAsInt())
|
assert.Equal(t, 512, params.QuotaConfig.MaxResourceGroupNumOfQueryNode.GetAsInt())
|
||||||
|
|
||||||
|
assert.Equal(t, -1, qc.MaxInsertSize.GetAsInt())
|
||||||
|
baseParams.Save(params.QuotaConfig.MaxInsertSize.Key, "1024")
|
||||||
|
assert.Equal(t, 1024, qc.MaxInsertSize.GetAsInt())
|
||||||
})
|
})
|
||||||
|
|
||||||
t.Run("test limit writing", func(t *testing.T) {
|
t.Run("test limit writing", func(t *testing.T) {
|
||||||
|
|
Loading…
Reference in New Issue