enhance: add `max insert request size` and `must use partition key` configs (#32433)

issue: https://github.com/milvus-io/milvus/issues/30577
/kind improvement

Signed-off-by: SimFG <bang.fu@zilliz.com>
pull/32450/head
SimFG 2024-04-19 10:31:20 +08:00 committed by GitHub
parent 31a29a2451
commit 8594b55ad5
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
17 changed files with 128 additions and 10 deletions

View File

@ -2801,6 +2801,7 @@ func (node *Proxy) search(ctx context.Context, request *milvuspb.SearchRequest)
node: node, node: node,
lb: node.lbPolicy, lb: node.lbPolicy,
enableMaterializedView: node.enableMaterializedView, enableMaterializedView: node.enableMaterializedView,
mustUsePartitionKey: Params.ProxyCfg.MustUsePartitionKey.GetAsBool(),
} }
guaranteeTs := request.GuaranteeTimestamp guaranteeTs := request.GuaranteeTimestamp
@ -3002,6 +3003,7 @@ func (node *Proxy) hybridSearch(ctx context.Context, request *milvuspb.HybridSea
qc: node.queryCoord, qc: node.queryCoord,
node: node, node: node,
lb: node.lbPolicy, lb: node.lbPolicy,
mustUsePartitionKey: Params.ProxyCfg.MustUsePartitionKey.GetAsBool(),
} }
guaranteeTs := request.GuaranteeTimestamp guaranteeTs := request.GuaranteeTimestamp
@ -3414,6 +3416,7 @@ func (node *Proxy) Query(ctx context.Context, request *milvuspb.QueryRequest) (*
request: request, request: request,
qc: node.queryCoord, qc: node.queryCoord,
lb: node.lbPolicy, lb: node.lbPolicy,
mustUsePartitionKey: Params.ProxyCfg.MustUsePartitionKey.GetAsBool(),
} }
res, err := node.query(ctx, qt) res, err := node.query(ctx, qt)
if merr.Ok(res.Status) && err == nil { if merr.Ok(res.Status) && err == nil {

View File

@ -1590,6 +1590,14 @@ func TestProxy(t *testing.T) {
resp, err := proxy.Search(ctx, req) resp, err := proxy.Search(ctx, req)
assert.NoError(t, err) assert.NoError(t, err)
assert.Equal(t, commonpb.ErrorCode_Success, resp.Status.ErrorCode) assert.Equal(t, commonpb.ErrorCode_Success, resp.Status.ErrorCode)
{
Params.Save(Params.ProxyCfg.MustUsePartitionKey.Key, "true")
resp, err := proxy.Search(ctx, req)
assert.NoError(t, err)
assert.NotEqual(t, commonpb.ErrorCode_Success, resp.Status.ErrorCode)
Params.Reset(Params.ProxyCfg.MustUsePartitionKey.Key)
}
}) })
constructAdvancedSearchRequest := func() *milvuspb.SearchRequest { constructAdvancedSearchRequest := func() *milvuspb.SearchRequest {

View File

@ -212,6 +212,12 @@ func (t *createCollectionTask) validatePartitionKey() error {
} }
} }
mustPartitionKey := Params.ProxyCfg.MustUsePartitionKey.GetAsBool()
if mustPartitionKey && idx == -1 {
return merr.WrapErrParameterInvalidMsg("partition key must be set when creating the collection" +
" because the mustUsePartitionKey config is true")
}
if idx == -1 { if idx == -1 {
if t.GetNumPartitions() != 0 { if t.GetNumPartitions() != 0 {
return fmt.Errorf("num_partitions should only be specified with partition key field enabled") return fmt.Errorf("num_partitions should only be specified with partition key field enabled")

View File

@ -112,6 +112,13 @@ func (it *insertTask) PreExecute(ctx context.Context) error {
return err return err
} }
maxInsertSize := Params.QuotaConfig.MaxInsertSize.GetAsInt()
if maxInsertSize != -1 && it.insertMsg.Size() > maxInsertSize {
log.Warn("insert request size exceeds maxInsertSize",
zap.Int("request size", it.insertMsg.Size()), zap.Int("maxInsertSize", maxInsertSize))
return merr.WrapErrParameterTooLarge("insert request size exceeds maxInsertSize")
}
schema, err := globalMetaCache.GetCollectionSchema(ctx, it.insertMsg.GetDbName(), collectionName) schema, err := globalMetaCache.GetCollectionSchema(ctx, it.insertMsg.GetDbName(), collectionName)
if err != nil { if err != nil {
log.Warn("get collection schema from global meta cache failed", zap.String("collectionName", collectionName), zap.Error(err)) log.Warn("get collection schema from global meta cache failed", zap.String("collectionName", collectionName), zap.Error(err))

View File

@ -11,6 +11,8 @@ import (
"github.com/milvus-io/milvus-proto/go-api/v2/msgpb" "github.com/milvus-io/milvus-proto/go-api/v2/msgpb"
"github.com/milvus-io/milvus-proto/go-api/v2/schemapb" "github.com/milvus-io/milvus-proto/go-api/v2/schemapb"
"github.com/milvus-io/milvus/pkg/mq/msgstream" "github.com/milvus-io/milvus/pkg/mq/msgstream"
"github.com/milvus-io/milvus/pkg/util/merr"
"github.com/milvus-io/milvus/pkg/util/paramtable"
) )
func TestInsertTask_CheckAligned(t *testing.T) { func TestInsertTask_CheckAligned(t *testing.T) {
@ -285,3 +287,23 @@ func TestInsertTask(t *testing.T) {
assert.ElementsMatch(t, channels, it.pChannels) assert.ElementsMatch(t, channels, it.pChannels)
}) })
} }
func TestMaxInsertSize(t *testing.T) {
t.Run("test MaxInsertSize", func(t *testing.T) {
paramtable.Init()
Params.Save(Params.QuotaConfig.MaxInsertSize.Key, "1")
defer Params.Reset(Params.QuotaConfig.MaxInsertSize.Key)
it := insertTask{
ctx: context.Background(),
insertMsg: &msgstream.InsertMsg{
InsertRequest: msgpb.InsertRequest{
DbName: "hooooooo",
CollectionName: "fooooo",
},
},
}
err := it.PreExecute(context.Background())
assert.Error(t, err)
assert.ErrorIs(t, err, merr.ErrParameterTooLarge)
})
}

View File

@ -68,6 +68,7 @@ type queryTask struct {
reQuery bool reQuery bool
allQueryCnt int64 allQueryCnt int64
totalRelatedDataSize int64 totalRelatedDataSize int64
mustUsePartitionKey bool
} }
type queryParams struct { type queryParams struct {
@ -303,6 +304,10 @@ func (t *queryTask) PreExecute(ctx context.Context) error {
if t.partitionKeyMode && len(t.request.GetPartitionNames()) != 0 { if t.partitionKeyMode && len(t.request.GetPartitionNames()) != 0 {
return errors.New("not support manually specifying the partition names if partition key mode is used") return errors.New("not support manually specifying the partition names if partition key mode is used")
} }
if t.mustUsePartitionKey && !t.partitionKeyMode {
return merr.WrapErrParameterInvalidMsg("must use partition key in the query request " +
"because the mustUsePartitionKey config is true")
}
for _, tag := range t.request.PartitionNames { for _, tag := range t.request.PartitionNames {
if err := validatePartitionTag(tag, false); err != nil { if err := validatePartitionTag(tag, false); err != nil {

View File

@ -170,6 +170,15 @@ func TestQueryTask_all(t *testing.T) {
assert.Equal(t, typeutil.ZeroTimestamp, task.TimeoutTimestamp) assert.Equal(t, typeutil.ZeroTimestamp, task.TimeoutTimestamp)
task.ctx = ctx1 task.ctx = ctx1
assert.NoError(t, task.PreExecute(ctx)) assert.NoError(t, task.PreExecute(ctx))
{
task.mustUsePartitionKey = true
err := task.PreExecute(ctx)
assert.Error(t, err)
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
task.mustUsePartitionKey = false
}
// after preExecute // after preExecute
assert.Greater(t, task.TimeoutTimestamp, typeutil.ZeroTimestamp) assert.Greater(t, task.TimeoutTimestamp, typeutil.ZeroTimestamp)

View File

@ -61,6 +61,7 @@ type searchTask struct {
requery bool requery bool
partitionKeyMode bool partitionKeyMode bool
enableMaterializedView bool enableMaterializedView bool
mustUsePartitionKey bool
userOutputFields []string userOutputFields []string
@ -135,6 +136,10 @@ func (t *searchTask) PreExecute(ctx context.Context) error {
if t.partitionKeyMode && len(t.request.GetPartitionNames()) != 0 { if t.partitionKeyMode && len(t.request.GetPartitionNames()) != 0 {
return errors.New("not support manually specifying the partition names if partition key mode is used") return errors.New("not support manually specifying the partition names if partition key mode is used")
} }
if t.mustUsePartitionKey && !t.partitionKeyMode {
return merr.WrapErrParameterInvalidMsg("must use partition key in the search request " +
"because the mustUsePartitionKey config is true")
}
if !t.partitionKeyMode && len(t.request.GetPartitionNames()) > 0 { if !t.partitionKeyMode && len(t.request.GetPartitionNames()) > 0 {
// translate partition name to partition ids. Use regex-pattern to match partition name. // translate partition name to partition ids. Use regex-pattern to match partition name.

View File

@ -328,6 +328,14 @@ func TestSearchTask_PreExecute(t *testing.T) {
assert.NoError(t, task.PreExecute(ctx)) assert.NoError(t, task.PreExecute(ctx))
assert.Greater(t, task.TimeoutTimestamp, typeutil.ZeroTimestamp) assert.Greater(t, task.TimeoutTimestamp, typeutil.ZeroTimestamp)
{
task.mustUsePartitionKey = true
err = task.PreExecute(ctx)
assert.Error(t, err)
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
task.mustUsePartitionKey = false
}
// field not exist // field not exist
task.ctx = context.TODO() task.ctx = context.TODO()
task.request.OutputFields = []string{testInt64Field + funcutil.GenRandomStr()} task.request.OutputFields = []string{testInt64Field + funcutil.GenRandomStr()}

View File

@ -696,6 +696,12 @@ func TestCreateCollectionTask(t *testing.T) {
err = task.PreExecute(ctx) err = task.PreExecute(ctx)
assert.NoError(t, err) assert.NoError(t, err)
Params.Save(Params.ProxyCfg.MustUsePartitionKey.Key, "true")
err = task.PreExecute(ctx)
assert.Error(t, err)
assert.ErrorIs(t, err, merr.ErrParameterInvalid)
Params.Reset(Params.ProxyCfg.MustUsePartitionKey.Key)
task.Schema = []byte{0x1, 0x2, 0x3, 0x4} task.Schema = []byte{0x1, 0x2, 0x3, 0x4}
err = task.PreExecute(ctx) err = task.PreExecute(ctx)
assert.Error(t, err) assert.Error(t, err)

View File

@ -111,6 +111,7 @@ var (
// Parameter related // Parameter related
ErrParameterInvalid = newMilvusError("invalid parameter", 1100, false) ErrParameterInvalid = newMilvusError("invalid parameter", 1100, false)
ErrParameterMissing = newMilvusError("missing parameter", 1101, false) ErrParameterMissing = newMilvusError("missing parameter", 1101, false)
ErrParameterTooLarge = newMilvusError("parameter too large", 1102, false)
// Metrics related // Metrics related
ErrMetricNotFound = newMilvusError("metric not found", 1200, false) ErrMetricNotFound = newMilvusError("metric not found", 1200, false)

View File

@ -136,6 +136,7 @@ func (s *ErrSuite) TestWrap() {
s.ErrorIs(WrapErrParameterInvalid(8, 1, "failed to create"), ErrParameterInvalid) s.ErrorIs(WrapErrParameterInvalid(8, 1, "failed to create"), ErrParameterInvalid)
s.ErrorIs(WrapErrParameterInvalidRange(1, 1<<16, 0, "topk should be in range"), ErrParameterInvalid) s.ErrorIs(WrapErrParameterInvalidRange(1, 1<<16, 0, "topk should be in range"), ErrParameterInvalid)
s.ErrorIs(WrapErrParameterMissing("alias_name", "no alias parameter"), ErrParameterMissing) s.ErrorIs(WrapErrParameterMissing("alias_name", "no alias parameter"), ErrParameterMissing)
s.ErrorIs(WrapErrParameterTooLarge("unit test"), ErrParameterTooLarge)
// Metrics related // Metrics related
s.ErrorIs(WrapErrMetricNotFound("unknown", "failed to get metric"), ErrMetricNotFound) s.ErrorIs(WrapErrMetricNotFound("unknown", "failed to get metric"), ErrMetricNotFound)

View File

@ -863,6 +863,14 @@ func WrapErrParameterMissing[T any](param T, msg ...string) error {
return err return err
} }
func WrapErrParameterTooLarge(name string, msg ...string) error {
err := wrapFields(ErrParameterTooLarge, value("message", name))
if len(msg) > 0 {
err = errors.Wrap(err, strings.Join(msg, "->"))
}
return err
}
// Metrics related // Metrics related
func WrapErrMetricNotFound(name string, msg ...string) error { func WrapErrMetricNotFound(name string, msg ...string) error {
err := wrapFields(ErrMetricNotFound, value("metric", name)) err := wrapFields(ErrMetricNotFound, value("metric", name))

View File

@ -1011,6 +1011,7 @@ type proxyConfig struct {
RetryTimesOnReplica ParamItem `refreshable:"true"` RetryTimesOnReplica ParamItem `refreshable:"true"`
RetryTimesOnHealthCheck ParamItem `refreshable:"true"` RetryTimesOnHealthCheck ParamItem `refreshable:"true"`
PartitionNameRegexp ParamItem `refreshable:"true"` PartitionNameRegexp ParamItem `refreshable:"true"`
MustUsePartitionKey ParamItem `refreshable:"true"`
AccessLog AccessLogConfig AccessLog AccessLogConfig
@ -1338,6 +1339,15 @@ please adjust in embedded Milvus: false`,
} }
p.PartitionNameRegexp.Init(base.mgr) p.PartitionNameRegexp.Init(base.mgr)
p.MustUsePartitionKey = ParamItem{
Key: "proxy.mustUsePartitionKey",
Version: "2.4.1",
DefaultValue: "false",
Doc: "switch for whether proxy must use partition key for the collection",
Export: true,
}
p.MustUsePartitionKey.Init(base.mgr)
p.GracefulStopTimeout = ParamItem{ p.GracefulStopTimeout = ParamItem{
Key: "proxy.gracefulStopTimeout", Key: "proxy.gracefulStopTimeout",
Version: "2.3.7", Version: "2.3.7",

View File

@ -170,6 +170,10 @@ func TestComponentParam(t *testing.T) {
params.Save("proxy.gracefulStopTimeout", "100") params.Save("proxy.gracefulStopTimeout", "100")
assert.Equal(t, 100*time.Second, Params.GracefulStopTimeout.GetAsDuration(time.Second)) assert.Equal(t, 100*time.Second, Params.GracefulStopTimeout.GetAsDuration(time.Second))
assert.False(t, Params.MustUsePartitionKey.GetAsBool())
params.Save("proxy.mustUsePartitionKey", "true")
assert.True(t, Params.MustUsePartitionKey.GetAsBool())
}) })
// t.Run("test proxyConfig panic", func(t *testing.T) { // t.Run("test proxyConfig panic", func(t *testing.T) {

View File

@ -128,6 +128,7 @@ type quotaConfig struct {
NQLimit ParamItem `refreshable:"true"` NQLimit ParamItem `refreshable:"true"`
MaxQueryResultWindow ParamItem `refreshable:"true"` MaxQueryResultWindow ParamItem `refreshable:"true"`
MaxOutputSize ParamItem `refreshable:"true"` MaxOutputSize ParamItem `refreshable:"true"`
MaxInsertSize ParamItem `refreshable:"true"`
MaxResourceGroupNumOfQueryNode ParamItem `refreshable:"true"` MaxResourceGroupNumOfQueryNode ParamItem `refreshable:"true"`
// limit writing // limit writing
@ -1537,6 +1538,15 @@ Check https://milvus.io/docs/limitations.md for more details.`,
} }
p.MaxOutputSize.Init(base.mgr) p.MaxOutputSize.Init(base.mgr)
p.MaxInsertSize = ParamItem{
Key: "quotaAndLimits.limits.maxInsertSize",
Version: "2.4.1",
DefaultValue: "-1", // -1 means no limit, the unit is byte
Doc: `maximum size of a single insert request, in bytes, -1 means no limit`,
Export: true,
}
p.MaxInsertSize.Init(base.mgr)
p.MaxResourceGroupNumOfQueryNode = ParamItem{ p.MaxResourceGroupNumOfQueryNode = ParamItem{
Key: "quotaAndLimits.limits.maxResourceGroupNumOfQueryNode", Key: "quotaAndLimits.limits.maxResourceGroupNumOfQueryNode",
Version: "2.4.1", Version: "2.4.1",

View File

@ -175,11 +175,16 @@ func TestQuotaParam(t *testing.T) {
}) })
t.Run("test limits", func(t *testing.T) { t.Run("test limits", func(t *testing.T) {
params.Init(NewBaseTable(SkipRemote(true)))
assert.Equal(t, 65536, qc.MaxCollectionNum.GetAsInt()) assert.Equal(t, 65536, qc.MaxCollectionNum.GetAsInt())
assert.Equal(t, 65536, qc.MaxCollectionNumPerDB.GetAsInt()) assert.Equal(t, 65536, qc.MaxCollectionNumPerDB.GetAsInt())
assert.Equal(t, 1024, params.QuotaConfig.MaxResourceGroupNumOfQueryNode.GetAsInt()) assert.Equal(t, 1024, params.QuotaConfig.MaxResourceGroupNumOfQueryNode.GetAsInt())
params.Save(params.QuotaConfig.MaxResourceGroupNumOfQueryNode.Key, "512") params.Save(params.QuotaConfig.MaxResourceGroupNumOfQueryNode.Key, "512")
assert.Equal(t, 512, params.QuotaConfig.MaxResourceGroupNumOfQueryNode.GetAsInt()) assert.Equal(t, 512, params.QuotaConfig.MaxResourceGroupNumOfQueryNode.GetAsInt())
assert.Equal(t, -1, qc.MaxInsertSize.GetAsInt())
baseParams.Save(params.QuotaConfig.MaxInsertSize.Key, "1024")
assert.Equal(t, 1024, qc.MaxInsertSize.GetAsInt())
}) })
t.Run("test limit writing", func(t *testing.T) { t.Run("test limit writing", func(t *testing.T) {