Update quota params and disable limit for showCollection (#19641)

Signed-off-by: bigsheeper <yihao.dai@zilliz.com> Signed-off-by: bigsheeper <yihao.dai@zilliz.com>
2022-10-09 14:30:58 +08:00 · 2022-10-09 14:30:58 +08:00 · f98dbcf5be
parent a85e44d169
commit f98dbcf5be
6 changed files with 82 additions and 82 deletions
--- a/configs/milvus.yaml
+++ b/configs/milvus.yaml
@@ -377,43 +377,43 @@ quotaAndLimits:
  enabled: false # `true` to enable quota and limits, `false` to disable.

  # quotaCenterCollectInterval is the time interval that quotaCenter
-  # collects metrics from Query cluster and Data cluster.
+  # collects metrics from Proxies, Query cluster and Data cluster.
  quotaCenterCollectInterval: 3 # seconds, (0 ~ 65536)

  ddl: # ddl limit rates, default no limit.
    enabled: false
-    collectionRate: # requests per minute, default no limit, rate for CreateCollection, DropCollection, HasCollection, DescribeCollection, LoadCollection, ReleaseCollection
-    partitionRate: # requests per minute, default no limit, rate for CreatePartition, DropPartition, HasPartition, LoadPartition, ReleasePartition
-    indexRate: # requests per minute, default no limit, rate for CreateIndex, DropIndex, DescribeIndex
-    flushRate: # requests per minute, default no limit, rate for flush
-    compactionRate: # requests per minute, default no limit, rate for manualCompaction
+    collectionRate: # qps, default no limit, rate for CreateCollection, DropCollection, LoadCollection, ReleaseCollection
+    partitionRate: # qps, default no limit, rate for CreatePartition, DropPartition, LoadPartition, ReleasePartition
+
+  indexRate:
+    enabled: false
+    max: # qps, default no limit, rate for CreateIndex, DropIndex
+  flushRate:
+    enabled: false
+    max: # qps, default no limit, rate for flush
+  compactionRate:
+    enabled: false
+    max: # qps, default no limit, rate for manualCompaction

  # dml limit rates, default no limit.
-  # The maximum rate will not be greater than `max`,
-  # and the rate after handling back pressure will not be less than `min`.
+  # The maximum rate will not be greater than `max`.
  dml:
    enabled: false
    insertRate:
      max: # MB/s, default no limit
-      min: # MB/s, default 0
    deleteRate:
      max: # MB/s, default no limit
-      min: # MB/s, default 0
    bulkLoadRate: # not supported yet. TODO: limit bulkLoad rate
      max: # MB/s, default no limit
-      min: # MB/s, default 0

  # dql limit rates, default no limit.
-  # The maximum rate will not be greater than `max`,
-  # and the rate after handling back pressure will not be less than `min`.
+  # The maximum rate will not be greater than `max`.
  dql:
    enabled: false
    searchRate:
      max: # vps (vectors per second), default no limit
-      min: # vps (vectors per second), default 0
    queryRate:
      max: # qps, default no limit
-      min: # qps, default 0

  # limitWriting decides whether dml requests are allowed.
  limitWriting:
@@ -432,10 +432,10 @@ quotaAndLimits:
      # When memoryLowWaterLevel < memory usage < memoryHighWaterLevel, reduce the dml rate;
      # When memory usage < memoryLowWaterLevel, no action.
      # memoryLowWaterLevel should be less than memoryHighWaterLevel.
-      dataNodeMemoryLowWaterLevel: 0.8 # (0, 1], memoryLowWaterLevel in DataNodes
-      dataNodeMemoryHighWaterLevel: 0.9 # (0, 1], memoryHighWaterLevel in DataNodes
-      queryNodeMemoryLowWaterLevel: 0.8 # (0, 1], memoryLowWaterLevel in QueryNodes
-      queryNodeMemoryHighWaterLevel: 0.9 # (0, 1], memoryHighWaterLevel in QueryNodes
+      dataNodeMemoryLowWaterLevel: 0.85 # (0, 1], memoryLowWaterLevel in DataNodes
+      dataNodeMemoryHighWaterLevel: 0.95 # (0, 1], memoryHighWaterLevel in DataNodes
+      queryNodeMemoryLowWaterLevel: 0.85 # (0, 1], memoryLowWaterLevel in QueryNodes
+      queryNodeMemoryHighWaterLevel: 0.95 # (0, 1], memoryHighWaterLevel in QueryNodes

  # limitReading decides whether dql requests are allowed.
  limitReading:
--- a/internal/proxy/multi_rate_limiter.go
+++ b/internal/proxy/multi_rate_limiter.go
@@ -106,11 +106,11 @@ func (rl *rateLimiter) registerLimiters() {
 		case internalpb.RateType_DDLPartition:
 			r = Params.QuotaConfig.DDLPartitionRate
 		case internalpb.RateType_DDLIndex:
-			r = Params.QuotaConfig.DDLIndexRate
+			r = Params.QuotaConfig.MaxIndexRate
 		case internalpb.RateType_DDLFlush:
-			r = Params.QuotaConfig.DDLFlushRate
+			r = Params.QuotaConfig.MaxFlushRate
 		case internalpb.RateType_DDLCompaction:
-			r = Params.QuotaConfig.DDLCompactionRate
+			r = Params.QuotaConfig.MaxCompactionRate
 		case internalpb.RateType_DMLInsert:
 			r = Params.QuotaConfig.DMLMaxInsertRate
 		case internalpb.RateType_DMLDelete:
--- a/internal/proxy/rate_limit_interceptor.go
+++ b/internal/proxy/rate_limit_interceptor.go
@@ -65,15 +65,15 @@ func getRequestInfo(req interface{}) (internalpb.RateType, int, error) {
 		return internalpb.RateType_DQLSearch, int(r.GetNq()), nil
 	case *milvuspb.QueryRequest:
 		return internalpb.RateType_DQLQuery, 1, nil // think of the query request's nq as 1
-	case *milvuspb.CreateCollectionRequest, *milvuspb.DropCollectionRequest, *milvuspb.HasCollectionRequest:
+	case *milvuspb.CreateCollectionRequest, *milvuspb.DropCollectionRequest:
 		return internalpb.RateType_DDLCollection, 1, nil
-	case *milvuspb.LoadCollectionRequest, *milvuspb.ReleaseCollectionRequest, *milvuspb.ShowCollectionsRequest:
+	case *milvuspb.LoadCollectionRequest, *milvuspb.ReleaseCollectionRequest:
 		return internalpb.RateType_DDLCollection, 1, nil
-	case *milvuspb.CreatePartitionRequest, *milvuspb.DropPartitionRequest, *milvuspb.HasPartitionRequest:
+	case *milvuspb.CreatePartitionRequest, *milvuspb.DropPartitionRequest:
 		return internalpb.RateType_DDLPartition, 1, nil
-	case *milvuspb.LoadPartitionsRequest, *milvuspb.ReleasePartitionsRequest, *milvuspb.ShowPartitionsRequest:
+	case *milvuspb.LoadPartitionsRequest, *milvuspb.ReleasePartitionsRequest:
 		return internalpb.RateType_DDLPartition, 1, nil
-	case *milvuspb.CreateIndexRequest, *milvuspb.DropIndexRequest, *milvuspb.DescribeIndexRequest:
+	case *milvuspb.CreateIndexRequest, *milvuspb.DropIndexRequest:
 		return internalpb.RateType_DDLIndex, 1, nil
 	case *milvuspb.FlushRequest:
 		return internalpb.RateType_DDLFlush, 1, nil
@@ -130,20 +130,6 @@ func getFailedResponse(req interface{}, code commonpb.ErrorCode, reason string)
 		*milvuspb.LoadPartitionsRequest, *milvuspb.ReleasePartitionsRequest,
 		*milvuspb.CreateIndexRequest, *milvuspb.DropIndexRequest:
 		return failedStatus(code, reason), nil
-	case *milvuspb.HasCollectionRequest, *milvuspb.HasPartitionRequest:
-		return failedBoolResponse(code, reason), nil
-	case *milvuspb.ShowCollectionsRequest:
-		return &milvuspb.ShowCollectionsResponse{
-			Status: failedStatus(code, reason),
-		}, nil
-	case *milvuspb.ShowPartitionsRequest:
-		return &milvuspb.ShowPartitionsResponse{
-			Status: failedStatus(code, reason),
-		}, nil
-	case *milvuspb.DescribeIndexRequest:
-		return &milvuspb.DescribeIndexResponse{
-			Status: failedStatus(code, reason),
-		}, nil
 	case *milvuspb.FlushRequest:
 		return &milvuspb.FlushResponse{
 			Status: failedStatus(code, reason),
--- a/internal/proxy/rate_limit_interceptor_test.go
+++ b/internal/proxy/rate_limit_interceptor_test.go
@@ -96,10 +96,6 @@ func TestRateLimitInterceptor(t *testing.T) {
 		testGetFailedResponse(&milvuspb.SearchRequest{})
 		testGetFailedResponse(&milvuspb.QueryRequest{})
 		testGetFailedResponse(&milvuspb.CreateCollectionRequest{})
-		testGetFailedResponse(&milvuspb.HasCollectionRequest{})
-		testGetFailedResponse(&milvuspb.ShowCollectionsRequest{})
-		testGetFailedResponse(&milvuspb.ShowPartitionsRequest{})
-		testGetFailedResponse(&milvuspb.DescribeIndexRequest{})
 		testGetFailedResponse(&milvuspb.FlushRequest{})
 		testGetFailedResponse(&milvuspb.ManualCompactionRequest{})

--- a/internal/util/paramtable/quota_param.go
+++ b/internal/util/paramtable/quota_param.go
@@ -32,12 +32,9 @@ const (
 	// defaultMin is the default minimal rate.
 	defaultMin = float64(0)
 	// defaultLowWaterLevel is the default memory low water level.
-	defaultLowWaterLevel = float64(0.8)
+	defaultLowWaterLevel = float64(0.85)
 	// defaultHighWaterLevel is the default memory high water level.
-	defaultHighWaterLevel = float64(0.9)
-
-	// secondsPerMinute is used to convert minutes to seconds.
-	secondsPerMinute = 60.0
+	defaultHighWaterLevel = float64(0.95)
 )

 // quotaConfig is configuration for quota and limitations.
@@ -52,9 +49,13 @@ type quotaConfig struct {
 	DDLLimitEnabled   bool
 	DDLCollectionRate float64
 	DDLPartitionRate  float64
-	DDLIndexRate      float64
-	DDLFlushRate      float64
-	DDLCompactionRate float64
+
+	IndexLimitEnabled      bool
+	MaxIndexRate           float64
+	FlushLimitEnabled      bool
+	MaxFlushRate           float64
+	CompactionLimitEnabled bool
+	MaxCompactionRate      float64

 	// dml
 	DMLLimitEnabled    bool
@@ -103,9 +104,13 @@ func (p *quotaConfig) init(base *BaseTable) {
 	p.initDDLLimitEnabled()
 	p.initDDLCollectionRate()
 	p.initDDLPartitionRate()
-	p.initDDLIndexRate()
-	p.initDDLFlushRate()
-	p.initDDLCompactionRate()
+
+	p.initIndexLimitEnabled()
+	p.initMaxIndexRate()
+	p.initFlushLimitEnabled()
+	p.initMaxFlushRate()
+	p.initCompactionLimitEnabled()
+	p.initMaxCompactionRate()

 	// dml
 	p.initDMLLimitEnabled()
@@ -167,7 +172,6 @@ func (p *quotaConfig) initDDLCollectionRate() {
 		return
 	}
 	p.DDLCollectionRate = p.Base.ParseFloatWithDefault("quotaAndLimits.ddl.collectionRate", defaultMax)
-	p.DDLCollectionRate /= secondsPerMinute
 	// [0 ~ Inf)
 	if p.DDLCollectionRate < 0 {
 		p.DDLCollectionRate = defaultMax
@@ -180,49 +184,57 @@ func (p *quotaConfig) initDDLPartitionRate() {
 		return
 	}
 	p.DDLPartitionRate = p.Base.ParseFloatWithDefault("quotaAndLimits.ddl.partitionRate", defaultMax)
-	p.DDLPartitionRate /= secondsPerMinute
 	// [0 ~ Inf)
 	if p.DDLPartitionRate < 0 {
 		p.DDLPartitionRate = defaultMax
 	}
 }

-func (p *quotaConfig) initDDLIndexRate() {
-	if !p.DDLLimitEnabled {
-		p.DDLIndexRate = defaultMax
+func (p *quotaConfig) initIndexLimitEnabled() {
+	p.IndexLimitEnabled = p.Base.ParseBool("quotaAndLimits.indexRate.enabled", false)
+}
+
+func (p *quotaConfig) initMaxIndexRate() {
+	if !p.IndexLimitEnabled {
+		p.MaxIndexRate = defaultMax
 		return
 	}
-	p.DDLIndexRate = p.Base.ParseFloatWithDefault("quotaAndLimits.ddl.indexRate", defaultMax)
-	p.DDLIndexRate /= secondsPerMinute
+	p.MaxIndexRate = p.Base.ParseFloatWithDefault("quotaAndLimits.indexRate.max", defaultMax)
 	// [0 ~ Inf)
-	if p.DDLIndexRate < 0 {
-		p.DDLIndexRate = defaultMax
+	if p.MaxIndexRate < 0 {
+		p.MaxIndexRate = defaultMax
 	}
 }

-func (p *quotaConfig) initDDLFlushRate() {
-	if !p.DDLLimitEnabled {
-		p.DDLFlushRate = defaultMax
+func (p *quotaConfig) initFlushLimitEnabled() {
+	p.FlushLimitEnabled = p.Base.ParseBool("quotaAndLimits.flushRate.enabled", false)
+}
+
+func (p *quotaConfig) initMaxFlushRate() {
+	if !p.FlushLimitEnabled {
+		p.MaxFlushRate = defaultMax
 		return
 	}
-	p.DDLFlushRate = p.Base.ParseFloatWithDefault("quotaAndLimits.ddl.flushRate", defaultMax)
-	p.DDLFlushRate /= secondsPerMinute
+	p.MaxFlushRate = p.Base.ParseFloatWithDefault("quotaAndLimits.flushRate.max", defaultMax)
 	// [0 ~ Inf)
-	if p.DDLFlushRate < 0 {
-		p.DDLFlushRate = defaultMax
+	if p.MaxFlushRate < 0 {
+		p.MaxFlushRate = defaultMax
 	}
 }

-func (p *quotaConfig) initDDLCompactionRate() {
-	if !p.DDLLimitEnabled {
-		p.DDLCompactionRate = defaultMax
+func (p *quotaConfig) initCompactionLimitEnabled() {
+	p.CompactionLimitEnabled = p.Base.ParseBool("quotaAndLimits.compactionRate.enabled", false)
+}
+
+func (p *quotaConfig) initMaxCompactionRate() {
+	if !p.CompactionLimitEnabled {
+		p.MaxCompactionRate = defaultMax
 		return
 	}
-	p.DDLCompactionRate = p.Base.ParseFloatWithDefault("quotaAndLimits.ddl.compactionRate", defaultMax)
-	p.DDLCompactionRate /= secondsPerMinute
+	p.MaxCompactionRate = p.Base.ParseFloatWithDefault("quotaAndLimits.compactionRate.max", defaultMax)
 	// [0 ~ Inf)
-	if p.DDLCompactionRate < 0 {
-		p.DDLCompactionRate = defaultMax
+	if p.MaxCompactionRate < 0 {
+		p.MaxCompactionRate = defaultMax
 	}
 }

--- a/internal/util/paramtable/quota_param_test.go
+++ b/internal/util/paramtable/quota_param_test.go
@@ -36,9 +36,15 @@ func TestQuotaParam(t *testing.T) {
 		assert.Equal(t, false, qc.DDLLimitEnabled)
 		assert.Equal(t, defaultMax, qc.DDLCollectionRate)
 		assert.Equal(t, defaultMax, qc.DDLPartitionRate)
-		assert.Equal(t, defaultMax, qc.DDLIndexRate)
-		assert.Equal(t, defaultMax, qc.DDLFlushRate)
-		assert.Equal(t, defaultMax, qc.DDLCompactionRate)
+	})
+
+	t.Run("test functional params", func(t *testing.T) {
+		assert.Equal(t, false, qc.IndexLimitEnabled)
+		assert.Equal(t, defaultMax, qc.MaxIndexRate)
+		assert.Equal(t, false, qc.FlushLimitEnabled)
+		assert.Equal(t, defaultMax, qc.MaxFlushRate)
+		assert.Equal(t, false, qc.CompactionLimitEnabled)
+		assert.Equal(t, defaultMax, qc.MaxCompactionRate)
 	})

 	t.Run("test dml", func(t *testing.T) {