# Licensed to the LF AI & Data foundation under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

# Related configuration of etcd, used to store Milvus metadata.
etcd:
  # List of etcd endpoints, each written as host:port.
  endpoints:
    - localhost:2379
  rootPath: by-dev  # The root path where data is stored in etcd
  metaSubPath: meta  # metaRootPath = rootPath + '/' + metaSubPath
  kvSubPath: kv  # kvRootPath = rootPath + '/' + kvSubPath
  # Full path = rootPath/metaSubPath/segmentBinlogSubPath
  segmentBinlogSubPath: datacoord/binlog/segment
  # Full path = rootPath/metaSubPath/collectionBinlogSubPath
  collectionBinlogSubPath: datacoord/binlog/collection
  # Full path = rootPath/metaSubPath/flushStreamPosSubPath
  flushStreamPosSubPath: datacoord/flushstream
  # Full path = rootPath/metaSubPath/statsStreamPosSubPath
  statsStreamPosSubPath: datacoord/statsstream

# Related configuration of minio, which is responsible for data persistence for Milvus.
minio:
  address: localhost  # Address of MinIO/S3
  port: 9000  # Port of MinIO/S3
  # NOTE(review): the key pair below looks like a development default;
  # override it for any non-local deployment.
  accessKeyID: minioadmin  # accessKeyID of MinIO/S3
  secretAccessKey: minioadmin  # MinIO/S3 encryption string
  useSSL: false  # Access to MinIO/S3 with SSL
  bucketName: "a-bucket"  # Bucket name in MinIO/S3
  rootPath: files  # The root path where the message is stored in MinIO/S3

# Related configuration of pulsar, used to manage Milvus logs of recent
# mutation operations, output streaming log, and provide log
# publish-subscribe services.
pulsar:
  address: localhost  # Address of pulsar
  port: 6650  # Port of pulsar
  # Maximum size of each message in pulsar, in bytes (5 * 1024 * 1024).
  maxMessageSize: 5242880

# Configuration of rocksmq: message storage path, page size, and retention limits.
rocksmq:
  path: /var/lib/milvus/rdb_data  # The path where the message is stored in rocksmq
  # The size of each page of messages in rocksmq: 2 GB (2 * 1024 * 1024 * 1024 bytes).
  rocksmqPageSize: 2147483648
  # The retention time of the message in rocksmq: 7 days (7 * 24 * 60 minutes).
  retentionTimeInMinutes: 10080
  # The retention size of the message in rocksmq: 8 GB (8 * 1024 MB).
  retentionSizeInMB: 8192

# Related configuration of rootCoord, used to handle data definition language (DDL)
# and data control language (DCL) requests.
rootCoord:
  address: localhost
  port: 53100

  grpc:
    serverMaxRecvSize: 2147483647  # math.MaxInt32, Maximum data size received by the server
    serverMaxSendSize: 2147483647  # math.MaxInt32, Maximum data size sent by the server
    clientMaxRecvSize: 104857600  # 100 MB, Maximum data size received by the client
    clientMaxSendSize: 104857600  # 100 MB, Maximum data size sent by the client

  dmlChannelNum: 256  # The number of dml channels created at system startup
  maxPartitionNum: 4096  # Maximum number of partitions in a collection
  # It's a threshold. When the segment size is less than this value,
  # the segment will not be indexed.
  minSegmentSizeToEnableIndex: 1024
  # Timeout value.
  # NOTE(review): the previous comment said "5 seconds", which contradicts the
  # value 3600; presumably the unit is seconds (i.e. 1 hour) - confirm against
  # the code that reads rootCoord.timeout.
  timeout: 3600

# Related configuration of proxy, used to validate client requests and reduce the returned results.
proxy:
  port: 19530

  grpc:
    serverMaxRecvSize: 536870912  # 512 MB, 512 * 1024 * 1024
    serverMaxSendSize: 536870912  # 512 MB, 512 * 1024 * 1024
    clientMaxRecvSize: 104857600  # 100 MB, 100 * 1024 * 1024
    clientMaxSendSize: 104857600  # 100 MB, 100 * 1024 * 1024

  timeTickInterval: 200  # ms, the interval that proxy synchronize the time tick

  msgStream:
    insert:
      bufSize: 1024  # msgPack chan buffer size
    search:
      bufSize: 512  # msgPack chan buffer size
    searchResult:
      recvBufSize: 1024  # msgPack chan buffer size
      pulsarBufSize: 1024  # pulsar chan buffer size
    timeTick:
      bufSize: 512

  maxNameLength: 255  # Maximum length of name for a collection or alias
  maxFieldNum: 256  # Maximum number of fields in a collection
  maxDimension: 32768  # Maximum dimension of a vector
  maxShardNum: 256  # Maximum number of shards in a collection
  maxTaskNum: 1024  # max task number of proxy task queue
  bufFlagExpireTime: 3600  # second, the time to expire bufFlag from cache in collectResultLoop
  bufFlagCleanupInterval: 600  # second, the interval to clean bufFlag cache in collectResultLoop

# Related configuration of queryCoord, used to manage topology and load balancing
# for the query nodes, and handoff from growing segments to sealed segments.
queryCoord:
  address: localhost
  port: 19531
  autoHandoff: true  # Enable auto handoff
  autoBalance: true  # Enable auto balance
  overloadedMemoryThresholdPercentage: 90  # The threshold percentage that memory overload
  balanceIntervalSeconds: 60
  memoryUsageMaxDifferencePercentage: 30

  grpc:
    serverMaxRecvSize: 2147483647  # math.MaxInt32
    serverMaxSendSize: 2147483647  # math.MaxInt32
    clientMaxRecvSize: 104857600  # 100 MB, 100 * 1024 * 1024
    clientMaxSendSize: 104857600  # 100 MB, 100 * 1024 * 1024

# Related configuration of queryNode, used to run hybrid search between vector and scalar data.
queryNode:
  # GB, default 32 GB. `cacheSize` is the memory used for caching data for
  # faster query. The `cacheSize` must be less than system memory size.
  cacheSize: 32
  gracefulTime: 0  # Minimum time before the newly inserted data can be searched (in ms)
  port: 21123

  grpc:
    serverMaxRecvSize: 2147483647  # math.MaxInt32
    serverMaxSendSize: 2147483647  # math.MaxInt32
    clientMaxRecvSize: 104857600  # 100 MB, 100 * 1024 * 1024
    clientMaxSendSize: 104857600  # 100 MB, 100 * 1024 * 1024

  stats:
    publishInterval: 1000  # Interval for querynode to report node information (milliseconds)

  dataSync:
    flowGraph:
      maxQueueLength: 1024  # Maximum length of task queue in flowgraph
      maxParallelism: 1024  # Maximum number of tasks executed in parallel in the flowgraph

  msgStream:
    search:
      recvBufSize: 512  # msgPack channel buffer size
      pulsarBufSize: 512  # pulsar channel buffer size
    searchResult:
      recvBufSize: 64  # msgPack channel buffer size

  # Segcore will divide a segment into multiple chunks.
  segcore:
    chunkRows: 32768  # The number of vectors in a chunk.

# Configuration of indexCoord: address, port, and gRPC message size limits.
indexCoord:
  address: localhost
  port: 31000

  grpc:
    serverMaxRecvSize: 2147483647  # math.MaxInt32
    serverMaxSendSize: 2147483647  # math.MaxInt32
    clientMaxRecvSize: 104857600  # 100 MB, 100 * 1024 * 1024
    clientMaxSendSize: 104857600  # 100 MB, 100 * 1024 * 1024

# Configuration of indexNode: port and gRPC message size limits.
indexNode:
  port: 21121

  grpc:
    serverMaxRecvSize: 2147483647  # math.MaxInt32
    serverMaxSendSize: 2147483647  # math.MaxInt32
    clientMaxRecvSize: 104857600  # 100 MB, 100 * 1024 * 1024
    clientMaxSendSize: 104857600  # 100 MB, 100 * 1024 * 1024

# Configuration of dataCoord: address/port, gRPC limits, compaction,
# segment sizing, and garbage collection.
dataCoord:
  address: localhost
  port: 13333

  grpc:
    serverMaxRecvSize: 2147483647  # math.MaxInt32
    serverMaxSendSize: 2147483647  # math.MaxInt32
    clientMaxRecvSize: 104857600  # 100 MB, 100 * 1024 * 1024
    clientMaxSendSize: 104857600  # 100 MB, 100 * 1024 * 1024

  enableCompaction: true  # Enable data segment compression
  enableGarbageCollection: false

  segment:
    maxSize: 512  # Maximum size of a segment in MB
    sealProportion: 0.75  # It's the minimum proportion for a segment which can be sealed
    assignmentExpiration: 2000  # The time of the assignment expiration in ms

  compaction:
    enableAutoCompaction: true

  gc:
    interval: 3600  # gc interval in seconds
    # File meta missing tolerance duration in seconds (24 * 60 * 60 = 1 day).
    missingTolerance: 86400
    # Tolerance duration in seconds for files that belong to a dropped entity
    # (24 * 60 * 60 = 1 day).
    dropTolerance: 86400

# Configuration of dataNode: port, gRPC limits, flowgraph sizing, and flush buffer size.
dataNode:
  port: 21124

  grpc:
    serverMaxRecvSize: 2147483647  # math.MaxInt32
    serverMaxSendSize: 2147483647  # math.MaxInt32
    clientMaxRecvSize: 104857600  # 100 MB, 100 * 1024 * 1024
    clientMaxSendSize: 104857600  # 100 MB, 100 * 1024 * 1024

  dataSync:
    flowGraph:
      maxQueueLength: 1024  # Maximum length of task queue in flowgraph
      maxParallelism: 1024  # Maximum number of tasks executed in parallel in the flowgraph

  flush:
    # Max buffer size to flush for a single segment.
    insertBufSize: 16777216  # Bytes, 16 MB

# Configure whether to store the vector and the local path when querying/searching in Querynode.
localStorage:
  path: /var/lib/milvus/data/
  enabled: true

# Configures the system log output.
log:
  level: debug  # debug, info, warn, error, panic, fatal
  file:
    rootPath: ""  # default to stdout, stderr
    maxSize: 300  # MB
    maxAge: 10  # Maximum time for log retention in day.
    maxBackups: 20
  format: text  # text/json

# Message channel naming: prefixes used to build channel names and subscription names.
msgChannel:
  # Channel name generation rule: ${namePrefix}-${ChannelIdx}
  chanNamePrefix:
    cluster: "by-dev"
    rootCoordTimeTick: "rootcoord-timetick"
    rootCoordStatistics: "rootcoord-statistics"
    rootCoordDml: "rootcoord-dml"
    rootCoordDelta: "rootcoord-delta"
    search: "search"
    searchResult: "searchResult"
    proxyTimeTick: "proxyTimeTick"
    queryTimeTick: "queryTimeTick"
    queryNodeStats: "query-node-stats"
    # Cmd for loadIndex, flush, etc...
    cmd: "cmd"
    dataCoordInsertChannel: "insert-channel-"
    dataCoordStatistic: "datacoord-statistics-channel"
    dataCoordTimeTick: "datacoord-timetick-channel"
    dataCoordSegmentInfo: "segment-info-channel"

  # skip replay query channel under failure recovery
  # NOTE(review): nesting was reconstructed; this key is placed directly under
  # msgChannel (not under chanNamePrefix) because it is not a channel name -
  # confirm against the code that reads it. The value is kept as the quoted
  # string "false", exactly as before.
  skipQueryChannelRecovery: "false"

  # Sub name generation rule: ${subNamePrefix}-${NodeID}
  subNamePrefix:
    rootCoordSubNamePrefix: "rootCoord"
    proxySubNamePrefix: "proxy"
    queryNodeSubNamePrefix: "queryNode"
    dataNodeSubNamePrefix: "dataNode"
    dataCoordSubNamePrefix: "dataCoord"

# Common settings: default partition and index names, and retention duration.
common:
  defaultPartitionName: "_default"  # default partition name for a collection
  defaultIndexName: "_default_idx"  # default index name
  retentionDuration: 432000  # 5 days in seconds

# Knowhere settings: CPU SIMD instruction set selection.
knowhere:
  # Default value: auto
  # Valid values: [auto, avx512, avx2, avx, sse4_2]
  # This configuration is only used by querynode and indexnode, it selects
  # CPU instruction set for Searching and Index-building.
  simdType: auto