2021-10-11 13:15:00 +00:00
# Licensed to the LF AI & Data foundation under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
2020-11-18 09:32:52 +00:00
# with the License. You may obtain a copy of the License at
#
2021-10-11 13:15:00 +00:00
# http://www.apache.org/licenses/LICENSE-2.0
2020-11-18 09:32:52 +00:00
#
2021-10-11 13:15:00 +00:00
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
2020-11-18 09:32:52 +00:00
2021-09-23 08:38:24 +00:00
# Related configuration of etcd, used to store Milvus metadata.
2020-11-20 09:10:24 +00:00
etcd :
2021-06-11 14:04:41 +00:00
# List of etcd endpoints, one host:port entry per item.
endpoints :
- localhost:2379
2020-11-20 09:10:24 +00:00
rootPath : by-dev # Root prefix that the sub-paths below are appended to
2020-11-28 11:06:48 +00:00
metaSubPath : meta # metaRootPath = rootPath + '/' + metaSubPath
kvSubPath : kv # kvRootPath = rootPath + '/' + kvSubPath
2021-06-21 03:40:15 +00:00
segmentBinlogSubPath : datacoord/binlog/segment # Full path = rootPath/metaSubPath/segmentBinlogSubPath
collectionBinlogSubPath : datacoord/binlog/collection # Full path = rootPath/metaSubPath/collectionBinlogSubPath
flushStreamPosSubPath : datacoord/flushstream # Full path = rootPath/metaSubPath/flushStreamPosSubPath
statsStreamPosSubPath : datacoord/statsstream # Full path = rootPath/metaSubPath/statsStreamPosSubPath
2020-11-19 02:46:17 +00:00
2021-09-24 10:40:13 +00:00
# Related configuration of minio, which is responsible for data persistence for Milvus.
2020-12-08 06:41:04 +00:00
minio :
address : localhost # Address of MinIO/S3
2021-10-18 10:02:57 +00:00
port : 9000 # Port of MinIO/S3
2020-12-08 06:41:04 +00:00
# NOTE(review): minioadmin/minioadmin looks like the stock MinIO default credential pair;
# confirm it is overridden outside of local development.
accessKeyID : minioadmin # MinIO/S3 access key ID
2021-10-28 11:51:03 +00:00
secretAccessKey : minioadmin # MinIO/S3 secret access key (previously described as the "encryption string")
2020-12-08 06:41:04 +00:00
useSSL : false # SSL is turned off in this default configuration
2020-12-26 08:28:55 +00:00
bucketName : "a-bucket" # Name of the MinIO/S3 bucket
2021-09-24 12:50:23 +00:00
rootPath : files # Root path; presumably the prefix used inside the bucket — TODO confirm
2020-12-08 06:41:04 +00:00
2021-10-11 13:21:47 +00:00
# Related configuration of pulsar, used to manage Milvus logs of recent mutation operations, output the streaming log, and provide log publish-subscribe services.
2020-11-20 09:10:24 +00:00
pulsar :
address : localhost # Address of pulsar
port : 6650 # Port of pulsar
2021-10-11 13:19:40 +00:00
maxMessageSize : 5242880 # 5 * 1024 * 1024 bytes, maximum size of each message in pulsar.
2020-11-19 02:46:17 +00:00
2021-06-25 11:44:11 +00:00
# Related configuration of rocksmq: storage path, page size and retention limits.
rocksmq :
2021-11-08 02:17:18 +00:00
path : /var/lib/milvus/rdb_data # Filesystem path used by rocksmq; presumably where its data is stored — TODO confirm
2021-11-11 09:18:43 +00:00
rocksmqPageSize : 2147483648 # 2 GB, 2 * 1024 * 1024 * 1024 bytes
retentionTimeInMinutes : 10080 # 7 days, 7 * 24 * 60 minutes
retentionSizeInMB : 8192 # 8 GB, 8 * 1024 MB
2021-06-25 11:44:11 +00:00
2021-10-12 00:20:33 +00:00
# Related configuration of rootCoord, used to handle data definition language (DDL) and data control language (DCL) requests.
2021-06-22 11:08:03 +00:00
rootCoord :
2020-11-20 09:10:24 +00:00
address : localhost
port : 53100
2020-11-19 02:46:17 +00:00
2021-08-04 05:03:24 +00:00
# gRPC maximum receive/send sizes, in bytes (104857600 = 100 * 1024 * 1024).
grpc :
serverMaxRecvSize : 2147483647 # math.MaxInt32
serverMaxSendSize : 2147483647 # math.MaxInt32
clientMaxRecvSize : 104857600 # 100 MB, 100 * 1024 * 1024
clientMaxSendSize : 104857600 # 100 MB, 100 * 1024 * 1024
2021-11-12 10:53:11 +00:00
dmlChannelNum : 256 # The number of dml channels created at system startup
maxPartitionNum : 4096 # Maximum number of partitions in a collection
minSegmentSizeToEnableIndex : 1024 # Threshold: a segment whose size is below this value will not be indexed
timeout : 3600 # NOTE(review): previously documented as "time out, 5 seconds", which does not match 3600; unit presumably seconds — TODO confirm
timeTickInterval : 200 # ms, time tick synchronization interval; NOTE(review): the original note attributes this to proxy — confirm the wording for rootCoord
2021-10-11 13:29:27 +00:00
# Related configuration of proxy, used to validate client requests and reduce the returned results.
2021-06-22 11:08:03 +00:00
proxy :
2021-03-04 14:27:12 +00:00
port : 19530 # Port of proxy
2020-11-20 09:10:24 +00:00
2021-08-04 05:03:24 +00:00
# gRPC maximum receive/send sizes, in bytes (104857600 = 100 * 1024 * 1024).
grpc :
serverMaxRecvSize : 2147483647 # math.MaxInt32
serverMaxSendSize : 2147483647 # math.MaxInt32
clientMaxRecvSize : 104857600 # 100 MB, 100 * 1024 * 1024
clientMaxSendSize : 104857600 # 100 MB, 100 * 1024 * 1024
2021-11-12 10:53:11 +00:00
timeTickInterval : 200 # ms, the interval at which proxy synchronizes the time tick
# Buffer sizes of the message streams listed below.
msgStream :
insert :
bufSize : 1024 # msgPack chan buffer size
search :
bufSize : 512 # presumably the msgPack chan buffer size, as for insert — TODO confirm
searchResult :
recvBufSize : 1024 # msgPack chan buffer size
pulsarBufSize : 1024 # pulsar chan buffer size
timeTick :
bufSize : 512 # presumably the msgPack chan buffer size, as for insert — TODO confirm
maxNameLength : 255 # Maximum name length of a collection or alias
maxFieldNum : 64 # Maximum number of fields in a collection
maxDimension : 32768 # Maximum dimension of vector
maxShardNum : 256 # Maximum number of shards in a collection
maxTaskNum : 1024 # Maximum number of tasks in the proxy task queue
2021-10-11 08:28:05 +00:00
# Related configuration of queryCoord, used to manage topology and load balancing for the query nodes, and handoff from growing segments to sealed segments.
2021-06-22 08:44:09 +00:00
queryCoord :
2021-01-22 06:28:06 +00:00
address : localhost
port : 19531
2021-10-24 14:39:09 +00:00
autoHandoff : true # Presumably toggles the automatic growing-to-sealed segment handoff mentioned above — TODO confirm
2021-11-12 10:49:10 +00:00
autoBalance : false # Presumably toggles automatic load balancing across query nodes; off in this configuration — TODO confirm
overloadedMemoryThresholdPercentage : 90 # Percent, per the key name
balanceIntervalSeconds : 60 # Seconds, per the key name
memoryUsageMaxDifferencePercentage : 30 # Percent, per the key name
2021-01-22 06:28:06 +00:00
2021-08-04 05:03:24 +00:00
# gRPC maximum receive/send sizes, in bytes (104857600 = 100 * 1024 * 1024).
grpc :
serverMaxRecvSize : 2147483647 # math.MaxInt32
serverMaxSendSize : 2147483647 # math.MaxInt32
clientMaxRecvSize : 104857600 # 100 MB, 100 * 1024 * 1024
clientMaxSendSize : 104857600 # 100 MB, 100 * 1024 * 1024
2021-10-11 13:31:16 +00:00
# Related configuration of queryNode, used to run hybrid search between vector and scalar data.
2020-11-20 09:10:24 +00:00
queryNode :
2021-09-28 14:24:03 +00:00
cacheSize : 32 # GB, default 32 GB. `cacheSize` is the memory used for caching data for faster queries; it must be less than the system memory size.
2021-10-28 12:22:59 +00:00
gracefulTime : 0 # Minimum time before the newly inserted data can be searched (in ms)
2021-02-23 10:08:17 +00:00
port : 21123 # Port of queryNode
2021-01-19 10:32:57 +00:00
2021-08-04 05:03:24 +00:00
# gRPC maximum receive/send sizes, in bytes (104857600 = 100 * 1024 * 1024).
grpc :
serverMaxRecvSize : 2147483647 # math.MaxInt32
serverMaxSendSize : 2147483647 # math.MaxInt32
clientMaxRecvSize : 104857600 # 100 MB, 100 * 1024 * 1024
clientMaxSendSize : 104857600 # 100 MB, 100 * 1024 * 1024
2021-11-12 10:53:11 +00:00
stats :
publishInterval : 1000 # Interval at which querynode reports node information (milliseconds)
dataSync :
flowGraph :
maxQueueLength : 1024 # Maximum length of task queue in flowgraph
maxParallelism : 1024 # Maximum number of tasks executed in parallel in the flowgraph
msgStream :
search :
recvBufSize : 512 # msgPack channel buffer size
pulsarBufSize : 512 # pulsar channel buffer size
searchResult :
recvBufSize : 64 # msgPack channel buffer size
# Segcore divides a segment into multiple chunks.
segcore :
chunkRows : 32768 # The number of vectors in a chunk.
2021-06-22 11:08:03 +00:00
# Related configuration of indexCoord: listen address, port and gRPC size limits.
indexCoord :
2021-01-19 10:32:57 +00:00
address : localhost
2021-01-26 01:38:40 +00:00
port : 31000
2021-01-24 13:20:11 +00:00
2021-08-04 05:03:24 +00:00
# gRPC maximum receive/send sizes, in bytes (104857600 = 100 * 1024 * 1024).
grpc :
serverMaxRecvSize : 2147483647 # math.MaxInt32
serverMaxSendSize : 2147483647 # math.MaxInt32
clientMaxRecvSize : 104857600 # 100 MB, 100 * 1024 * 1024
clientMaxSendSize : 104857600 # 100 MB, 100 * 1024 * 1024
2021-02-23 10:08:17 +00:00
# Related configuration of indexNode: port and gRPC size limits.
indexNode :
port : 21121
2021-08-04 05:03:24 +00:00
# gRPC maximum receive/send sizes, in bytes (104857600 = 100 * 1024 * 1024).
grpc :
serverMaxRecvSize : 2147483647 # math.MaxInt32
serverMaxSendSize : 2147483647 # math.MaxInt32
clientMaxRecvSize : 104857600 # 100 MB, 100 * 1024 * 1024
clientMaxSendSize : 104857600 # 100 MB, 100 * 1024 * 1024
2021-06-21 10:22:13 +00:00
# Related configuration of dataCoord: address, port, gRPC size limits, compaction/GC switches and segment settings.
dataCoord :
2021-01-26 07:13:20 +00:00
address : localhost
port : 13333
2021-08-04 05:03:24 +00:00
# gRPC maximum receive/send sizes, in bytes (104857600 = 100 * 1024 * 1024).
grpc :
serverMaxRecvSize : 2147483647 # math.MaxInt32
serverMaxSendSize : 2147483647 # math.MaxInt32
clientMaxRecvSize : 104857600 # 100 MB, 100 * 1024 * 1024
clientMaxSendSize : 104857600 # 100 MB, 100 * 1024 * 1024
2021-11-11 15:38:42 +00:00
enableCompaction : false # Compaction is switched off in this configuration
enableGarbageCollection : false # Garbage collection is switched off in this configuration
2021-08-04 05:03:24 +00:00
2021-11-12 10:53:11 +00:00
segment :
maxSize : 512 # Maximum size of a segment in MB
sealProportion : 0.75 # Minimum proportion at which a segment can be sealed; presumably relative to maxSize — TODO confirm
assignmentExpiration : 2000 # ms
2021-01-24 13:20:11 +00:00
# Related configuration of dataNode: port, gRPC size limits, flowgraph limits and flush buffer size.
dataNode :
port : 21124
2021-02-19 07:37:04 +00:00
2021-08-04 05:03:24 +00:00
# gRPC maximum receive/send sizes, in bytes (104857600 = 100 * 1024 * 1024).
grpc :
serverMaxRecvSize : 2147483647 # math.MaxInt32
serverMaxSendSize : 2147483647 # math.MaxInt32
clientMaxRecvSize : 104857600 # 100 MB, 100 * 1024 * 1024
clientMaxSendSize : 104857600 # 100 MB, 100 * 1024 * 1024
2021-11-12 10:53:11 +00:00
dataSync :
flowGraph :
maxQueueLength : 1024 # Maximum length of task queue in flowgraph
maxParallelism : 1024 # Maximum number of tasks executed in parallel in the flowgraph
flush :
# Maximum buffer size to flush for a single segment.
insertBufSize : 16777216 # Bytes, 16 MB
2021-09-22 11:23:59 +00:00
# Configures whether vectors are stored locally, and under which local path, when querying/searching in Querynode.
2021-08-18 08:30:11 +00:00
localStorage :
2021-07-09 03:44:40 +00:00
path : /var/lib/milvus/data/ # Local path used for the stored data
2021-08-18 08:30:11 +00:00
enabled : true # Local storage is switched on in this configuration
2021-07-09 03:44:40 +00:00
2021-09-09 10:48:02 +00:00
# Configures the system log output.
2021-02-19 07:37:04 +00:00
log :
2021-06-19 04:38:06 +00:00
level : debug # Log level; other values: info, warn, error, panic, fatal
2021-02-19 07:37:04 +00:00
# Settings for the log file.
file :
2021-04-13 02:04:39 +00:00
rootPath : "" # Empty string means default to stdout, stderr
2021-02-19 07:37:04 +00:00
maxSize : 300 # MB
maxAge : 10 # day
maxBackups : 20 # presumably the number of rotated log files kept — TODO confirm
2021-03-16 13:30:44 +00:00
format : text # text/json
2021-09-26 11:46:17 +00:00
# Name prefixes for message channels and subscriptions.
msgChannel :
2021-10-09 02:55:14 +00:00
# Channel name generation rule: ${namePrefix}-${ChannelIdx}
2021-09-26 11:46:17 +00:00
chanNamePrefix :
cluster : "by-dev"
rootCoordTimeTick : "rootcoord-timetick"
rootCoordStatistics : "rootcoord-statistics"
rootCoordDml : "rootcoord-dml"
2021-11-03 13:04:14 +00:00
rootCoordDelta : "rootcoord-delta"
2021-09-26 11:46:17 +00:00
search : "search"
searchResult : "searchResult"
proxyTimeTick : "proxyTimeTick"
queryTimeTick : "queryTimeTick"
queryNodeStats : "query-node-stats"
2021-10-09 02:55:14 +00:00
# Cmd for loadIndex, flush, etc...
2021-09-26 11:46:17 +00:00
cmd : "cmd"
# NOTE(review): this prefix already ends with '-'; under the generation rule above
# that would yield a double dash — confirm this is intended.
dataCoordInsertChannel : "insert-channel-"
dataCoordStatistic : "datacoord-statistics-channel"
dataCoordTimeTick : "datacoord-timetick-channel"
dataCoordSegmentInfo : "segment-info-channel"
2021-11-05 06:57:44 +00:00
# Skip replaying the query channel during failure recovery.
# NOTE(review): the value is quoted, so YAML loads it as the string "false", not a boolean — confirm the consumer expects a string.
skipQueryChannelRecovery : "false"
2021-09-26 11:46:17 +00:00
2021-10-09 02:55:14 +00:00
# Sub name generation rule: ${subNamePrefix}-${NodeID}
2021-09-26 11:46:17 +00:00
subNamePrefix :
rootCoordSubNamePrefix : "rootCoord"
proxySubNamePrefix : "proxy"
queryNodeSubNamePrefix : "queryNode"
dataNodeSubNamePrefix : "dataNode"
dataCoordSubNamePrefix : "dataCoord"
# Common defaults: default partition and index names.
common :
defaultPartitionName : "_default" # Default partition name for a collection
2021-10-09 02:55:14 +00:00
defaultIndexName : "_default_idx" # Default index name
2021-11-01 02:26:03 +00:00
# Related configuration of knowhere: SIMD instruction set selection.
knowhere :
# Default value: auto
2021-11-08 02:21:04 +00:00
# Valid values: [auto, avx512, avx2, avx, sse4_2]
2021-11-01 02:26:03 +00:00
# This configuration is only used by querynode and indexnode. It selects the CPU instruction set for searching and index building.
simdType : auto