milvus/internal/metrics/metrics.go

651 lines
23 KiB
Go

package metrics
import (
"net/http"
"github.com/milvus-io/milvus/internal/log"
"github.com/prometheus/client_golang/prometheus"
"github.com/prometheus/client_golang/prometheus/promhttp"
"go.uber.org/zap"
)
const (
milvusNamespace = "milvus"
subSystemRootCoord = "rootcoord"
subSystemDataCoord = "dataCoord"
subSystemDataNode = "dataNode"
subSystemProxy = "proxy"
)
var (
// RootCoordProxyLister counts the num of registered proxy nodes
RootCoordProxyLister = prometheus.NewGaugeVec(
prometheus.GaugeOpts{
Namespace: milvusNamespace,
Subsystem: subSystemRootCoord,
Name: "list_of_proxy",
Help: "List of proxy nodes which have registered with etcd",
}, []string{"client_id"})
////////////////////////////////////////////////////////////////////////////
// for grpc
// RootCoordCreateCollectionCounter counts the num of calls of CreateCollection
RootCoordCreateCollectionCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemRootCoord,
Name: "create_collection_total",
Help: "Counter of create collection",
}, []string{"client_id", "type"})
// RootCoordDropCollectionCounter used to count the num of calls of DropCollection
RootCoordDropCollectionCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemRootCoord,
Name: "drop_collection_total",
Help: "Counter of drop collection",
}, []string{"client_id", "type"})
// RootCoordHasCollectionCounter used to count the num of calls of HasCollection
RootCoordHasCollectionCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemRootCoord,
Name: "has_collection_total",
Help: "Counter of has collection",
}, []string{"client_id", "type"})
// RootCoordDescribeCollectionCounter used to count the num of calls of DescribeCollection
RootCoordDescribeCollectionCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemRootCoord,
Name: "describe_collection_total",
Help: "Counter of describe collection",
}, []string{"client_id", "type"})
// RootCoordShowCollectionsCounter used to count the num of calls of ShowCollections
RootCoordShowCollectionsCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemRootCoord,
Name: "show_collections_total",
Help: "Counter of show collections",
}, []string{"client_id", "type"})
// RootCoordCreatePartitionCounter used to count the num of calls of CreatePartition
RootCoordCreatePartitionCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemRootCoord,
Name: "create_partition_total",
Help: "Counter of create partition",
}, []string{"client_id", "type"})
// RootCoordDropPartitionCounter used to count the num of calls of DropPartition
RootCoordDropPartitionCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemRootCoord,
Name: "drop_partition_total",
Help: "Counter of drop partition",
}, []string{"client_id", "type"})
// RootCoordHasPartitionCounter used to count the num of calls of HasPartition
RootCoordHasPartitionCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemRootCoord,
Name: "has_partition_total",
Help: "Counter of has partition",
}, []string{"client_id", "type"})
// RootCoordShowPartitionsCounter used to count the num of calls of ShowPartitions
RootCoordShowPartitionsCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemRootCoord,
Name: "show_partitions_total",
Help: "Counter of show partitions",
}, []string{"client_id", "type"})
// RootCoordCreateIndexCounter used to count the num of calls of CreateIndex
RootCoordCreateIndexCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemRootCoord,
Name: "create_index_total",
Help: "Counter of create index",
}, []string{"client_id", "type"})
// RootCoordDropIndexCounter used to count the num of calls of DropIndex
RootCoordDropIndexCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemRootCoord,
Name: "drop_index_total",
Help: "Counter of drop index",
}, []string{"client_id", "type"})
// RootCoordDescribeIndexCounter used to count the num of calls of DescribeIndex
RootCoordDescribeIndexCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemRootCoord,
Name: "describe_index_total",
Help: "Counter of describe index",
}, []string{"client_id", "type"})
// RootCoordDescribeSegmentCounter used to count the num of calls of DescribeSegment
RootCoordDescribeSegmentCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemRootCoord,
Name: "describe_segment_total",
Help: "Counter of describe segment",
}, []string{"client_id", "type"})
// RootCoordShowSegmentsCounter used to count the num of calls of ShowSegments
RootCoordShowSegmentsCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemRootCoord,
Name: "show_segments_total",
Help: "Counter of show segments",
}, []string{"client_id", "type"})
////////////////////////////////////////////////////////////////////////////
// for time tick
// RootCoordInsertChannelTimeTick used to count the time tick num of insert channel in 24H
RootCoordInsertChannelTimeTick = prometheus.NewGaugeVec(
prometheus.GaugeOpts{
Namespace: milvusNamespace,
Subsystem: subSystemRootCoord,
Name: "insert_channel_time_tick",
Help: "Time tick of insert Channel in 24H",
}, []string{"vchannel"})
// RootCoordDDChannelTimeTick used to count the time tick num of dd channel in 24H
RootCoordDDChannelTimeTick = prometheus.NewGauge(
prometheus.GaugeOpts{
Namespace: milvusNamespace,
Subsystem: subSystemRootCoord,
Name: "dd_channel_time_tick",
Help: "Time tick of dd Channel in 24H",
})
)
//RegisterRootCoord register RootCoord metrics
func RegisterRootCoord() {
prometheus.MustRegister(RootCoordProxyLister)
// for grpc
prometheus.MustRegister(RootCoordCreateCollectionCounter)
prometheus.MustRegister(RootCoordDropCollectionCounter)
prometheus.MustRegister(RootCoordHasCollectionCounter)
prometheus.MustRegister(RootCoordDescribeCollectionCounter)
prometheus.MustRegister(RootCoordShowCollectionsCounter)
prometheus.MustRegister(RootCoordCreatePartitionCounter)
prometheus.MustRegister(RootCoordDropPartitionCounter)
prometheus.MustRegister(RootCoordHasPartitionCounter)
prometheus.MustRegister(RootCoordShowPartitionsCounter)
prometheus.MustRegister(RootCoordCreateIndexCounter)
prometheus.MustRegister(RootCoordDropIndexCounter)
prometheus.MustRegister(RootCoordDescribeIndexCounter)
prometheus.MustRegister(RootCoordDescribeSegmentCounter)
prometheus.MustRegister(RootCoordShowSegmentsCounter)
// for time tick
prometheus.MustRegister(RootCoordInsertChannelTimeTick)
prometheus.MustRegister(RootCoordDDChannelTimeTick)
//prometheus.MustRegister(PanicCounter)
}
var (
// ProxyCreateCollectionCounter used to count the num of calls of CreateCollection
ProxyCreateCollectionCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemProxy,
Name: "create_collection_total",
Help: "Counter of create collection",
}, []string{"status"})
// ProxyDropCollectionCounter used to count the num of calls of DropCollection
ProxyDropCollectionCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemProxy,
Name: "drop_collection_total",
Help: "Counter of drop collection",
}, []string{"status"})
// ProxyHasCollectionCounter used to count the num of calls of HasCollection
ProxyHasCollectionCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemProxy,
Name: "has_collection_total",
Help: "Counter of has collection",
}, []string{"status"})
// ProxyLoadCollectionCounter used to count the num of calls of LoadCollection
ProxyLoadCollectionCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemProxy,
Name: "load_collection_total",
Help: "Counter of load collection",
}, []string{"status"})
// ProxyReleaseCollectionCounter used to count the num of calls of ReleaseCollection
ProxyReleaseCollectionCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemProxy,
Name: "release_collection_total",
Help: "Counter of release collection",
}, []string{"status"})
// ProxyDescribeCollectionCounter used to count the num of calls of DescribeCollection
ProxyDescribeCollectionCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemProxy,
Name: "describe_collection_total",
Help: "Counter of describe collection",
}, []string{"status"})
// ProxyGetCollectionStatisticsCounter used to count the num of calls of GetCollectionStatistics
ProxyGetCollectionStatisticsCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemProxy,
Name: "get_collection_statistics_total",
Help: "Counter of get collection statistics",
}, []string{"status"})
// ProxyShowCollectionsCounter used to count the num of calls of ShowCollections
ProxyShowCollectionsCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemProxy,
Name: "show_collections_total",
Help: "Counter of show collections",
}, []string{"status"})
// ProxyCreatePartitionCounter used to count the num of calls of CreatePartition
ProxyCreatePartitionCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemProxy,
Name: "create_partition_total",
Help: "Counter of create partition",
}, []string{"status"})
// ProxyDropPartitionCounter used to count the num of calls of DropPartition
ProxyDropPartitionCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemProxy,
Name: "drop_partition_total",
Help: "Counter of drop partition",
}, []string{"status"})
// ProxyHasPartitionCounter used to count the num of calls of HasPartition
ProxyHasPartitionCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemProxy,
Name: "has_partition_total",
Help: "Counter of has partition",
}, []string{"status"})
// ProxyLoadPartitionsCounter used to count the num of calls of LoadPartitions
ProxyLoadPartitionsCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemProxy,
Name: "load_partitions_total",
Help: "Counter of load partitions",
}, []string{"status"})
// ProxyReleasePartitionsCounter used to count the num of calls of ReleasePartitions
ProxyReleasePartitionsCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemProxy,
Name: "release_partitions_total",
Help: "Counter of release partitions",
}, []string{"status"})
// ProxyGetPartitionStatisticsCounter used to count the num of calls of GetPartitionStatistics
ProxyGetPartitionStatisticsCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemProxy,
Name: "get_partition_statistics_total",
Help: "Counter of get partition statistics",
}, []string{"status"})
// ProxyShowPartitionsCounter used to count the num of calls of ShowPartitions
ProxyShowPartitionsCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemProxy,
Name: "show_partitions_total",
Help: "Counter of show partitions",
}, []string{"status"})
// ProxyCreateIndexCounter used to count the num of calls of CreateIndex
ProxyCreateIndexCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemProxy,
Name: "create_index_counter",
Help: "Counter of create index",
}, []string{"status"})
// ProxyDescribeIndexCounter used to count the num of calls of DescribeIndex
ProxyDescribeIndexCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemProxy,
Name: "describe_index_counter",
Help: "Counter of describe index",
}, []string{"status"})
// ProxyGetIndexStateCounter used to count the num of calls of GetIndexState
ProxyGetIndexStateCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemProxy,
Name: "get_index_state_counter",
Help: "Counter of get index state",
}, []string{"status"})
// ProxyGetIndexBuildProgressCounter used to count the num of calls of GetIndexBuildProgress
ProxyGetIndexBuildProgressCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemProxy,
Name: "get_index_build_progress_total",
Help: "Counter of get index build progress",
}, []string{"status"})
// ProxyDropIndexCounter used to count the num of calls of DropIndex
ProxyDropIndexCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemProxy,
Name: "drop_index_total",
Help: "Counter of drop index",
}, []string{"status"})
// ProxyInsertCounter used to count the num of calls of Insert
ProxyInsertCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemProxy,
Name: "insert_total",
Help: "Counter of insert",
}, []string{"status"})
// ProxySearchCounter used to count the num of calls of Search
ProxySearchCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemProxy,
Name: "search_total",
Help: "Counter of search",
}, []string{"status"})
// ProxyRetrieveCounter used to count the num of calls of Retrieve
ProxyRetrieveCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemProxy,
Name: "retrieve_total",
Help: "Counter of retrieve",
}, []string{"status"})
// ProxyFlushCounter used to count the num of calls of Flush
ProxyFlushCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemProxy,
Name: "flush_total",
Help: "Counter of flush",
}, []string{"status"})
// ProxyQueryCounter used to count the num of calls of Query
ProxyQueryCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemProxy,
Name: "query_total",
Help: "Counter of query",
}, []string{"status"})
// ProxyGetPersistentSegmentInfoCounter used to count the num of calls of GetPersistentSegmentInfo
ProxyGetPersistentSegmentInfoCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemProxy,
Name: "get_persistent_segment_info_total",
Help: "Counter of get persistent segment info",
}, []string{"status"})
// ProxyGetQuerySegmentInfoCounter used to count the num of calls of GetQuerySegmentInfo
ProxyGetQuerySegmentInfoCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemProxy,
Name: "get_query_segment_info_total",
Help: "Counter of get query segment info",
}, []string{"status"})
// ProxyDummyCounter used to count the num of calls of Dummy
ProxyDummyCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemProxy,
Name: "dummy_total",
Help: "Counter of dummy",
}, []string{"status"})
// ProxyRegisterLinkCounter used to count the num of calls of RegisterLink
ProxyRegisterLinkCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemProxy,
Name: "register_link_total",
Help: "Counter of register link",
}, []string{"status"})
// ProxyGetComponentStatesCounter used to count the num of calls of GetComponentStates
ProxyGetComponentStatesCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemProxy,
Name: "get_component_states_total",
Help: "Counter of get component states",
}, []string{"status"})
// ProxyGetStatisticsChannelCounter used to count the num of calls of GetStatisticsChannel
ProxyGetStatisticsChannelCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemProxy,
Name: "get_statistics_channel_total",
Help: "Counter of get statistics channel",
}, []string{"status"})
// ProxyInvalidateCollectionMetaCacheCounter used to count the num of calls of InvalidateCollectionMetaCache
ProxyInvalidateCollectionMetaCacheCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemProxy,
Name: "invalidate_collection_meta_cache_total",
Help: "Counter of invalidate collection meta cache",
}, []string{"status"})
// ProxyGetDdChannelCounter used to count the num of calls of GetDdChannel
ProxyGetDdChannelCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemProxy,
Name: "get_dd_channel_total",
Help: "Counter of get dd channel",
}, []string{"status"})
// ProxyReleaseDQLMessageStreamCounter used to count the num of calls of ReleaseDQLMessageStream
ProxyReleaseDQLMessageStreamCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemProxy,
Name: "release_dql_message_stream_total",
Help: "Counter of release dql message stream",
}, []string{"status"})
// ProxyDmlChannelTimeTick used to count the time tick value of dml channels
ProxyDmlChannelTimeTick = prometheus.NewGaugeVec(
prometheus.GaugeOpts{
Namespace: milvusNamespace,
Subsystem: subSystemProxy,
Name: "dml_channels_time_tick",
Help: "Time tick of dml channels",
}, []string{"pchan"})
)
//RegisterProxy register Proxy metrics
func RegisterProxy() {
prometheus.MustRegister(ProxyCreateCollectionCounter)
prometheus.MustRegister(ProxyDropCollectionCounter)
prometheus.MustRegister(ProxyHasCollectionCounter)
prometheus.MustRegister(ProxyLoadCollectionCounter)
prometheus.MustRegister(ProxyReleaseCollectionCounter)
prometheus.MustRegister(ProxyDescribeCollectionCounter)
prometheus.MustRegister(ProxyGetCollectionStatisticsCounter)
prometheus.MustRegister(ProxyShowCollectionsCounter)
prometheus.MustRegister(ProxyCreatePartitionCounter)
prometheus.MustRegister(ProxyDropPartitionCounter)
prometheus.MustRegister(ProxyHasPartitionCounter)
prometheus.MustRegister(ProxyLoadPartitionsCounter)
prometheus.MustRegister(ProxyReleasePartitionsCounter)
prometheus.MustRegister(ProxyGetPartitionStatisticsCounter)
prometheus.MustRegister(ProxyShowPartitionsCounter)
prometheus.MustRegister(ProxyCreateIndexCounter)
prometheus.MustRegister(ProxyDescribeIndexCounter)
prometheus.MustRegister(ProxyGetIndexStateCounter)
prometheus.MustRegister(ProxyGetIndexBuildProgressCounter)
prometheus.MustRegister(ProxyDropIndexCounter)
prometheus.MustRegister(ProxyInsertCounter)
prometheus.MustRegister(ProxySearchCounter)
prometheus.MustRegister(ProxyRetrieveCounter)
prometheus.MustRegister(ProxyFlushCounter)
prometheus.MustRegister(ProxyQueryCounter)
prometheus.MustRegister(ProxyGetPersistentSegmentInfoCounter)
prometheus.MustRegister(ProxyGetQuerySegmentInfoCounter)
prometheus.MustRegister(ProxyDummyCounter)
prometheus.MustRegister(ProxyRegisterLinkCounter)
prometheus.MustRegister(ProxyGetComponentStatesCounter)
prometheus.MustRegister(ProxyGetStatisticsChannelCounter)
prometheus.MustRegister(ProxyInvalidateCollectionMetaCacheCounter)
prometheus.MustRegister(ProxyGetDdChannelCounter)
prometheus.MustRegister(ProxyReleaseDQLMessageStreamCounter)
prometheus.MustRegister(ProxyDmlChannelTimeTick)
}
//RegisterQueryCoord register QueryCoord metrics
func RegisterQueryCoord() {
}
//RegisterQueryNode register QueryNode metrics
func RegisterQueryNode() {
}
var (
//DataCoordDataNodeList records the num of regsitered data nodes
DataCoordDataNodeList = prometheus.NewGaugeVec(
prometheus.GaugeOpts{
Namespace: milvusNamespace,
Subsystem: subSystemDataCoord,
Name: "list_of_data_node",
Help: "List of data nodes registered within etcd",
}, []string{"status"},
)
)
//RegisterDataCoord register DataCoord metrics
func RegisterDataCoord() {
prometheus.MustRegister(DataCoordDataNodeList)
}
var (
// DataNodeFlushSegmentsCounter used to count the num of calls of FlushSegments
DataNodeFlushSegmentsCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemDataNode,
Name: "flush_segments_total",
Help: "Counter of flush segments",
}, []string{"type"})
// DataNodeWatchDmChannelsCounter used to count the num of calls of WatchDmChannels
DataNodeWatchDmChannelsCounter = prometheus.NewCounterVec(
prometheus.CounterOpts{
Namespace: milvusNamespace,
Subsystem: subSystemDataNode,
Name: "watch_dm_channels_total",
Help: "Counter of watch dm channel",
}, []string{"type"})
)
//RegisterDataNode register DataNode metrics
func RegisterDataNode() {
prometheus.MustRegister(DataNodeFlushSegmentsCounter)
prometheus.MustRegister(DataNodeWatchDmChannelsCounter)
}
//RegisterIndexCoord register IndexCoord metrics
func RegisterIndexCoord() {
}
//RegisterIndexNode register IndexNode metrics
func RegisterIndexNode() {
}
//RegisterMsgStreamCoord register MsgStreamCoord metrics
func RegisterMsgStreamCoord() {
}
//ServeHTTP serve prometheus http service
func ServeHTTP() {
http.Handle("/metrics", promhttp.Handler())
go func() {
if err := http.ListenAndServe(":9091", nil); err != nil {
log.Error("handle metrics failed", zap.Error(err))
}
}()
}