mirror of
https://github.com/minio/minio.git
synced 2025-01-11 15:03:22 -05:00
re-implement prometheus metrics endpoint to be simpler (#13922)
data-structures were repeatedly initialized this causes GC pressure, instead re-use the collectors. Initialize collectors in `init()`, also make sure to honor the cache semantics for performance requirements. Avoid a global map and a global lock for metrics lookup instead let them all be lock-free unless the cache is being invalidated.
This commit is contained in:
parent
890f43ffa5
commit
818f0201fc
@ -35,6 +35,51 @@ import (
|
||||
"github.com/prometheus/procfs"
|
||||
)
|
||||
|
||||
var (
|
||||
nodeCollector *minioNodeCollector
|
||||
clusterCollector *minioClusterCollector
|
||||
peerMetricsGroups []*MetricsGroup
|
||||
)
|
||||
|
||||
func init() {
|
||||
clusterMetricsGroups := []*MetricsGroup{
|
||||
getBucketUsageMetrics(),
|
||||
getMinioHealingMetrics(),
|
||||
getNodeHealthMetrics(),
|
||||
getClusterStorageMetrics(),
|
||||
}
|
||||
|
||||
peerMetricsGroups = []*MetricsGroup{
|
||||
getCacheMetrics(),
|
||||
getGoMetrics(),
|
||||
getHTTPMetrics(),
|
||||
getLocalStorageMetrics(),
|
||||
getMinioProcMetrics(),
|
||||
getMinioVersionMetrics(),
|
||||
getNetworkMetrics(),
|
||||
getS3TTFBMetric(),
|
||||
getILMNodeMetrics(),
|
||||
getScannerNodeMetrics(),
|
||||
}
|
||||
|
||||
allMetricsGroups := func() (allMetrics []*MetricsGroup) {
|
||||
allMetrics = append(allMetrics, clusterMetricsGroups...)
|
||||
allMetrics = append(allMetrics, peerMetricsGroups...)
|
||||
return allMetrics
|
||||
}()
|
||||
|
||||
nodeCollector = newMinioCollectorNode([]*MetricsGroup{
|
||||
getNodeHealthMetrics(),
|
||||
getCacheMetrics(),
|
||||
getHTTPMetrics(),
|
||||
getNetworkMetrics(),
|
||||
getMinioVersionMetrics(),
|
||||
getS3TTFBMetric(),
|
||||
})
|
||||
|
||||
clusterCollector = newMinioClusterCollector(allMetricsGroups)
|
||||
}
|
||||
|
||||
// MetricNamespace is top level grouping of metrics to create the metric name.
|
||||
type MetricNamespace string
|
||||
|
||||
@ -164,117 +209,37 @@ type Metric struct {
|
||||
Histogram map[string]uint64 `json:"Histogram"`
|
||||
}
|
||||
|
||||
func (m *Metric) copyMetric() Metric {
|
||||
metric := Metric{
|
||||
Description: m.Description,
|
||||
Value: m.Value,
|
||||
HistogramBucketLabel: m.HistogramBucketLabel,
|
||||
StaticLabels: make(map[string]string),
|
||||
VariableLabels: make(map[string]string),
|
||||
Histogram: make(map[string]uint64),
|
||||
}
|
||||
for k, v := range m.StaticLabels {
|
||||
metric.StaticLabels[k] = v
|
||||
}
|
||||
for k, v := range m.VariableLabels {
|
||||
metric.VariableLabels[k] = v
|
||||
}
|
||||
for k, v := range m.Histogram {
|
||||
metric.Histogram[k] = v
|
||||
}
|
||||
return metric
|
||||
}
|
||||
|
||||
// MetricsGroup are a group of metrics that are initialized together.
|
||||
type MetricsGroup struct {
|
||||
id string
|
||||
cacheInterval time.Duration
|
||||
cachedRead func(ctx context.Context, mg *MetricsGroup) []Metric
|
||||
read func(ctx context.Context) []Metric
|
||||
metricsCache timedValue
|
||||
}
|
||||
|
||||
var metricsGroupCache = make(map[string]*timedValue)
|
||||
var cacheLock sync.Mutex
|
||||
|
||||
func cachedRead(ctx context.Context, mg *MetricsGroup) (metrics []Metric) {
|
||||
cacheLock.Lock()
|
||||
defer cacheLock.Unlock()
|
||||
v, ok := metricsGroupCache[mg.id]
|
||||
if !ok {
|
||||
interval := mg.cacheInterval
|
||||
if interval == 0 {
|
||||
interval = 30 * time.Second
|
||||
// RegisterRead register the metrics populator function to be used
|
||||
// to populate new values upon cache invalidation.
|
||||
func (g *MetricsGroup) RegisterRead(read func(ctx context.Context) []Metric) {
|
||||
g.metricsCache.Once.Do(func() {
|
||||
g.metricsCache.TTL = 10 * time.Second
|
||||
g.metricsCache.Update = func() (interface{}, error) {
|
||||
return read(GlobalContext), nil
|
||||
}
|
||||
v = &timedValue{}
|
||||
v.Once.Do(func() {
|
||||
v.Update = func() (interface{}, error) {
|
||||
c := mg.read(ctx)
|
||||
return c, nil
|
||||
}
|
||||
v.TTL = interval
|
||||
})
|
||||
metricsGroupCache[mg.id] = v
|
||||
}
|
||||
c, err := v.Get()
|
||||
|
||||
// Get - returns cached value always upton the configured TTL,
|
||||
// once the TTL expires "read()" registered function is called
|
||||
// to return the new values and updated.
|
||||
func (g *MetricsGroup) Get() []Metric {
|
||||
c, err := g.metricsCache.Get()
|
||||
if err != nil {
|
||||
return []Metric{}
|
||||
}
|
||||
m := c.([]Metric)
|
||||
for i := range m {
|
||||
metrics = append(metrics, m[i].copyMetric())
|
||||
}
|
||||
return metrics
|
||||
|
||||
m, ok := c.([]Metric)
|
||||
if !ok {
|
||||
return []Metric{}
|
||||
}
|
||||
|
||||
// MetricsGenerator are functions that generate metric groups.
|
||||
type MetricsGenerator func() MetricsGroup
|
||||
|
||||
// GetGlobalGenerators gets all the generators the report global metrics pre calculated.
|
||||
func GetGlobalGenerators() []MetricsGenerator {
|
||||
g := []MetricsGenerator{
|
||||
getBucketUsageMetrics,
|
||||
getMinioHealingMetrics,
|
||||
getNodeHealthMetrics,
|
||||
getClusterStorageMetrics,
|
||||
}
|
||||
return g
|
||||
}
|
||||
|
||||
// GetAllGenerators gets all the metric generators.
|
||||
func GetAllGenerators() []MetricsGenerator {
|
||||
g := GetGlobalGenerators()
|
||||
g = append(g, GetGeneratorsForPeer()...)
|
||||
return g
|
||||
}
|
||||
|
||||
// GetGeneratorsForPeer - gets the generators to report to peer.
|
||||
func GetGeneratorsForPeer() []MetricsGenerator {
|
||||
g := []MetricsGenerator{
|
||||
getCacheMetrics,
|
||||
getGoMetrics,
|
||||
getHTTPMetrics,
|
||||
getLocalStorageMetrics,
|
||||
getMinioProcMetrics,
|
||||
getMinioVersionMetrics,
|
||||
getNetworkMetrics,
|
||||
getS3TTFBMetric,
|
||||
getILMNodeMetrics,
|
||||
getScannerNodeMetrics,
|
||||
}
|
||||
return g
|
||||
}
|
||||
|
||||
// GetSingleNodeGenerators gets the metrics that are local
|
||||
func GetSingleNodeGenerators() []MetricsGenerator {
|
||||
g := []MetricsGenerator{
|
||||
getNodeHealthMetrics,
|
||||
getCacheMetrics,
|
||||
getHTTPMetrics,
|
||||
getNetworkMetrics,
|
||||
getMinioVersionMetrics,
|
||||
getS3TTFBMetric,
|
||||
}
|
||||
return g
|
||||
return m
|
||||
}
|
||||
|
||||
func getClusterCapacityTotalBytesMD() MetricDescription {
|
||||
@ -286,6 +251,7 @@ func getClusterCapacityTotalBytesMD() MetricDescription {
|
||||
Type: gaugeMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getClusterCapacityFreeBytesMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: clusterMetricNamespace,
|
||||
@ -295,6 +261,7 @@ func getClusterCapacityFreeBytesMD() MetricDescription {
|
||||
Type: gaugeMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getClusterCapacityUsageBytesMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: clusterMetricNamespace,
|
||||
@ -304,6 +271,7 @@ func getClusterCapacityUsageBytesMD() MetricDescription {
|
||||
Type: gaugeMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getClusterCapacityUsageFreeBytesMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: clusterMetricNamespace,
|
||||
@ -323,6 +291,7 @@ func getNodeDiskUsedBytesMD() MetricDescription {
|
||||
Type: gaugeMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getNodeDiskFreeBytesMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: nodeMetricNamespace,
|
||||
@ -332,6 +301,7 @@ func getNodeDiskFreeBytesMD() MetricDescription {
|
||||
Type: gaugeMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getClusterDisksOfflineTotalMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: clusterMetricNamespace,
|
||||
@ -381,6 +351,7 @@ func getNodeDiskTotalBytesMD() MetricDescription {
|
||||
Type: gaugeMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getUsageLastScanActivityMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: minioMetricNamespace,
|
||||
@ -429,6 +400,7 @@ func getBucketRepFailedBytesMD() MetricDescription {
|
||||
Type: gaugeMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getBucketRepSentBytesMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: bucketMetricNamespace,
|
||||
@ -438,6 +410,7 @@ func getBucketRepSentBytesMD() MetricDescription {
|
||||
Type: gaugeMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getBucketRepReceivedBytesMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: bucketMetricNamespace,
|
||||
@ -457,6 +430,7 @@ func getBucketRepFailedOperationsMD() MetricDescription {
|
||||
Type: gaugeMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getBucketObjectDistributionMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: bucketMetricNamespace,
|
||||
@ -466,6 +440,7 @@ func getBucketObjectDistributionMD() MetricDescription {
|
||||
Type: histogramMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getInternodeFailedRequests() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: interNodeMetricNamespace,
|
||||
@ -485,6 +460,7 @@ func getInterNodeSentBytesMD() MetricDescription {
|
||||
Type: counterMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getInterNodeReceivedBytesMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: interNodeMetricNamespace,
|
||||
@ -494,6 +470,7 @@ func getInterNodeReceivedBytesMD() MetricDescription {
|
||||
Type: counterMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getS3SentBytesMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: s3MetricNamespace,
|
||||
@ -503,6 +480,7 @@ func getS3SentBytesMD() MetricDescription {
|
||||
Type: counterMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getS3ReceivedBytesMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: s3MetricNamespace,
|
||||
@ -512,6 +490,7 @@ func getS3ReceivedBytesMD() MetricDescription {
|
||||
Type: counterMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getS3RequestsInFlightMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: s3MetricNamespace,
|
||||
@ -521,6 +500,7 @@ func getS3RequestsInFlightMD() MetricDescription {
|
||||
Type: gaugeMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getS3RequestsInQueueMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: s3MetricNamespace,
|
||||
@ -530,6 +510,7 @@ func getS3RequestsInQueueMD() MetricDescription {
|
||||
Type: gaugeMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getS3RequestsTotalMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: s3MetricNamespace,
|
||||
@ -539,6 +520,7 @@ func getS3RequestsTotalMD() MetricDescription {
|
||||
Type: counterMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getS3RequestsErrorsMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: s3MetricNamespace,
|
||||
@ -548,6 +530,7 @@ func getS3RequestsErrorsMD() MetricDescription {
|
||||
Type: counterMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getS3RequestsCanceledMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: s3MetricNamespace,
|
||||
@ -557,6 +540,7 @@ func getS3RequestsCanceledMD() MetricDescription {
|
||||
Type: counterMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getS3RejectedAuthRequestsTotalMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: s3MetricNamespace,
|
||||
@ -566,6 +550,7 @@ func getS3RejectedAuthRequestsTotalMD() MetricDescription {
|
||||
Type: counterMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getS3RejectedHeaderRequestsTotalMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: s3MetricNamespace,
|
||||
@ -575,6 +560,7 @@ func getS3RejectedHeaderRequestsTotalMD() MetricDescription {
|
||||
Type: counterMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getS3RejectedTimestampRequestsTotalMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: s3MetricNamespace,
|
||||
@ -584,6 +570,7 @@ func getS3RejectedTimestampRequestsTotalMD() MetricDescription {
|
||||
Type: counterMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getS3RejectedInvalidRequestsTotalMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: s3MetricNamespace,
|
||||
@ -593,6 +580,7 @@ func getS3RejectedInvalidRequestsTotalMD() MetricDescription {
|
||||
Type: counterMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getCacheHitsTotalMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: minioNamespace,
|
||||
@ -602,6 +590,7 @@ func getCacheHitsTotalMD() MetricDescription {
|
||||
Type: counterMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getCacheHitsMissedTotalMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: minioNamespace,
|
||||
@ -611,6 +600,7 @@ func getCacheHitsMissedTotalMD() MetricDescription {
|
||||
Type: counterMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getCacheUsagePercentMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: minioNamespace,
|
||||
@ -620,6 +610,7 @@ func getCacheUsagePercentMD() MetricDescription {
|
||||
Type: gaugeMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getCacheUsageInfoMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: minioNamespace,
|
||||
@ -629,6 +620,7 @@ func getCacheUsageInfoMD() MetricDescription {
|
||||
Type: gaugeMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getCacheUsedBytesMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: minioNamespace,
|
||||
@ -638,6 +630,7 @@ func getCacheUsedBytesMD() MetricDescription {
|
||||
Type: gaugeMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getCacheTotalBytesMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: minioNamespace,
|
||||
@ -647,6 +640,7 @@ func getCacheTotalBytesMD() MetricDescription {
|
||||
Type: gaugeMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getCacheSentBytesMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: minioNamespace,
|
||||
@ -656,6 +650,7 @@ func getCacheSentBytesMD() MetricDescription {
|
||||
Type: counterMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getHealObjectsTotalMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: healMetricNamespace,
|
||||
@ -665,6 +660,7 @@ func getHealObjectsTotalMD() MetricDescription {
|
||||
Type: gaugeMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getHealObjectsHealTotalMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: healMetricNamespace,
|
||||
@ -684,6 +680,7 @@ func getHealObjectsFailTotalMD() MetricDescription {
|
||||
Type: gaugeMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getHealLastActivityTimeMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: healMetricNamespace,
|
||||
@ -693,6 +690,7 @@ func getHealLastActivityTimeMD() MetricDescription {
|
||||
Type: gaugeMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getNodeOnlineTotalMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: clusterMetricNamespace,
|
||||
@ -702,6 +700,7 @@ func getNodeOnlineTotalMD() MetricDescription {
|
||||
Type: gaugeMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getNodeOfflineTotalMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: clusterMetricNamespace,
|
||||
@ -711,6 +710,7 @@ func getNodeOfflineTotalMD() MetricDescription {
|
||||
Type: gaugeMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getMinIOVersionMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: minioMetricNamespace,
|
||||
@ -720,6 +720,7 @@ func getMinIOVersionMD() MetricDescription {
|
||||
Type: gaugeMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getMinIOCommitMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: minioMetricNamespace,
|
||||
@ -729,6 +730,7 @@ func getMinIOCommitMD() MetricDescription {
|
||||
Type: gaugeMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getS3TTFBDistributionMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: s3MetricNamespace,
|
||||
@ -738,6 +740,7 @@ func getS3TTFBDistributionMD() MetricDescription {
|
||||
Type: gaugeMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getMinioFDOpenMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: nodeMetricNamespace,
|
||||
@ -747,6 +750,7 @@ func getMinioFDOpenMD() MetricDescription {
|
||||
Type: gaugeMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getMinioFDLimitMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: nodeMetricNamespace,
|
||||
@ -756,6 +760,7 @@ func getMinioFDLimitMD() MetricDescription {
|
||||
Type: gaugeMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getMinioProcessIOWriteBytesMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: nodeMetricNamespace,
|
||||
@ -765,6 +770,7 @@ func getMinioProcessIOWriteBytesMD() MetricDescription {
|
||||
Type: counterMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getMinioProcessIOReadBytesMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: nodeMetricNamespace,
|
||||
@ -774,6 +780,7 @@ func getMinioProcessIOReadBytesMD() MetricDescription {
|
||||
Type: counterMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getMinioProcessIOWriteCachedBytesMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: nodeMetricNamespace,
|
||||
@ -783,6 +790,7 @@ func getMinioProcessIOWriteCachedBytesMD() MetricDescription {
|
||||
Type: counterMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getMinioProcessIOReadCachedBytesMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: nodeMetricNamespace,
|
||||
@ -792,6 +800,7 @@ func getMinioProcessIOReadCachedBytesMD() MetricDescription {
|
||||
Type: counterMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getMinIOProcessSysCallRMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: nodeMetricNamespace,
|
||||
@ -801,6 +810,7 @@ func getMinIOProcessSysCallRMD() MetricDescription {
|
||||
Type: counterMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getMinIOProcessSysCallWMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: nodeMetricNamespace,
|
||||
@ -810,6 +820,7 @@ func getMinIOProcessSysCallWMD() MetricDescription {
|
||||
Type: counterMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getMinIOGORoutineCountMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: nodeMetricNamespace,
|
||||
@ -819,6 +830,7 @@ func getMinIOGORoutineCountMD() MetricDescription {
|
||||
Type: gaugeMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getMinIOProcessStartTimeMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: nodeMetricNamespace,
|
||||
@ -828,6 +840,7 @@ func getMinIOProcessStartTimeMD() MetricDescription {
|
||||
Type: gaugeMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getMinIOProcessUptimeMD() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: nodeMetricNamespace,
|
||||
@ -837,6 +850,7 @@ func getMinIOProcessUptimeMD() MetricDescription {
|
||||
Type: gaugeMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getMinIOProcessResidentMemory() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: nodeMetricNamespace,
|
||||
@ -846,6 +860,7 @@ func getMinIOProcessResidentMemory() MetricDescription {
|
||||
Type: gaugeMetric,
|
||||
}
|
||||
}
|
||||
|
||||
func getMinIOProcessCPUTime() MetricDescription {
|
||||
return MetricDescription{
|
||||
Namespace: nodeMetricNamespace,
|
||||
@ -855,11 +870,10 @@ func getMinIOProcessCPUTime() MetricDescription {
|
||||
Type: counterMetric,
|
||||
}
|
||||
}
|
||||
func getMinioProcMetrics() MetricsGroup {
|
||||
return MetricsGroup{
|
||||
id: "MinioProcMetrics",
|
||||
cachedRead: cachedRead,
|
||||
read: func(ctx context.Context) (metrics []Metric) {
|
||||
|
||||
func getMinioProcMetrics() *MetricsGroup {
|
||||
mg := &MetricsGroup{}
|
||||
mg.RegisterRead(func(ctx context.Context) (metrics []Metric) {
|
||||
if runtime.GOOS == "windows" {
|
||||
return nil
|
||||
}
|
||||
@ -958,28 +972,25 @@ func getMinioProcMetrics() MetricsGroup {
|
||||
Value: stat.CPUTime(),
|
||||
})
|
||||
return
|
||||
},
|
||||
})
|
||||
return mg
|
||||
}
|
||||
}
|
||||
func getGoMetrics() MetricsGroup {
|
||||
return MetricsGroup{
|
||||
id: "GoMetrics",
|
||||
cachedRead: cachedRead,
|
||||
read: func(ctx context.Context) (metrics []Metric) {
|
||||
|
||||
func getGoMetrics() *MetricsGroup {
|
||||
mg := &MetricsGroup{}
|
||||
mg.RegisterRead(func(ctx context.Context) (metrics []Metric) {
|
||||
metrics = append(metrics, Metric{
|
||||
Description: getMinIOGORoutineCountMD(),
|
||||
Value: float64(runtime.NumGoroutine()),
|
||||
})
|
||||
return
|
||||
},
|
||||
})
|
||||
return mg
|
||||
}
|
||||
}
|
||||
func getS3TTFBMetric() MetricsGroup {
|
||||
return MetricsGroup{
|
||||
id: "s3TTFBMetric",
|
||||
cachedRead: cachedRead,
|
||||
read: func(ctx context.Context) (metrics []Metric) {
|
||||
|
||||
func getS3TTFBMetric() *MetricsGroup {
|
||||
mg := &MetricsGroup{}
|
||||
mg.RegisterRead(func(ctx context.Context) (metrics []Metric) {
|
||||
// Read prometheus metric on this channel
|
||||
ch := make(chan prometheus.Metric)
|
||||
var wg sync.WaitGroup
|
||||
@ -1017,8 +1028,8 @@ func getS3TTFBMetric() MetricsGroup {
|
||||
close(ch)
|
||||
wg.Wait()
|
||||
return
|
||||
},
|
||||
}
|
||||
})
|
||||
return mg
|
||||
}
|
||||
|
||||
func getTransitionPendingTasksMD() MetricDescription {
|
||||
@ -1051,11 +1062,9 @@ func getExpiryPendingTasksMD() MetricDescription {
|
||||
}
|
||||
}
|
||||
|
||||
func getILMNodeMetrics() MetricsGroup {
|
||||
return MetricsGroup{
|
||||
id: "ILMNodeMetrics",
|
||||
cachedRead: cachedRead,
|
||||
read: func(_ context.Context) []Metric {
|
||||
func getILMNodeMetrics() *MetricsGroup {
|
||||
mg := &MetricsGroup{}
|
||||
mg.RegisterRead(func(_ context.Context) []Metric {
|
||||
expPendingTasks := Metric{
|
||||
Description: getExpiryPendingTasksMD(),
|
||||
}
|
||||
@ -1077,15 +1086,13 @@ func getILMNodeMetrics() MetricsGroup {
|
||||
trPendingTasks,
|
||||
trActiveTasks,
|
||||
}
|
||||
},
|
||||
}
|
||||
})
|
||||
return mg
|
||||
}
|
||||
|
||||
func getScannerNodeMetrics() MetricsGroup {
|
||||
return MetricsGroup{
|
||||
id: "ScannerNodeMetrics",
|
||||
cachedRead: cachedRead,
|
||||
read: func(_ context.Context) []Metric {
|
||||
func getScannerNodeMetrics() *MetricsGroup {
|
||||
mg := &MetricsGroup{}
|
||||
mg.RegisterRead(func(_ context.Context) []Metric {
|
||||
metrics := []Metric{
|
||||
{
|
||||
Description: MetricDescription{
|
||||
@ -1166,15 +1173,13 @@ func getScannerNodeMetrics() MetricsGroup {
|
||||
})
|
||||
}
|
||||
return metrics
|
||||
},
|
||||
}
|
||||
})
|
||||
return mg
|
||||
}
|
||||
|
||||
func getMinioVersionMetrics() MetricsGroup {
|
||||
return MetricsGroup{
|
||||
id: "MinioVersionMetrics",
|
||||
cachedRead: cachedRead,
|
||||
read: func(_ context.Context) (metrics []Metric) {
|
||||
func getMinioVersionMetrics() *MetricsGroup {
|
||||
mg := &MetricsGroup{}
|
||||
mg.RegisterRead(func(_ context.Context) (metrics []Metric) {
|
||||
metrics = append(metrics, Metric{
|
||||
Description: getMinIOCommitMD(),
|
||||
VariableLabels: map[string]string{"commit": CommitID},
|
||||
@ -1184,15 +1189,13 @@ func getMinioVersionMetrics() MetricsGroup {
|
||||
VariableLabels: map[string]string{"version": Version},
|
||||
})
|
||||
return
|
||||
},
|
||||
}
|
||||
})
|
||||
return mg
|
||||
}
|
||||
|
||||
func getNodeHealthMetrics() MetricsGroup {
|
||||
return MetricsGroup{
|
||||
id: "NodeHealthMetrics",
|
||||
cachedRead: cachedRead,
|
||||
read: func(_ context.Context) (metrics []Metric) {
|
||||
func getNodeHealthMetrics() *MetricsGroup {
|
||||
mg := &MetricsGroup{}
|
||||
mg.RegisterRead(func(_ context.Context) (metrics []Metric) {
|
||||
if globalIsGateway {
|
||||
return
|
||||
}
|
||||
@ -1207,15 +1210,13 @@ func getNodeHealthMetrics() MetricsGroup {
|
||||
Value: float64(nodesDown),
|
||||
})
|
||||
return
|
||||
},
|
||||
}
|
||||
})
|
||||
return mg
|
||||
}
|
||||
|
||||
func getMinioHealingMetrics() MetricsGroup {
|
||||
return MetricsGroup{
|
||||
id: "minioHealingMetrics",
|
||||
cachedRead: cachedRead,
|
||||
read: func(_ context.Context) (metrics []Metric) {
|
||||
func getMinioHealingMetrics() *MetricsGroup {
|
||||
mg := &MetricsGroup{}
|
||||
mg.RegisterRead(func(_ context.Context) (metrics []Metric) {
|
||||
metrics = make([]Metric, 0, 5)
|
||||
if !globalIsErasure {
|
||||
return
|
||||
@ -1237,8 +1238,8 @@ func getMinioHealingMetrics() MetricsGroup {
|
||||
metrics = append(metrics, getHealedItems(bgSeq)...)
|
||||
metrics = append(metrics, getFailedItems(bgSeq)...)
|
||||
return
|
||||
},
|
||||
}
|
||||
})
|
||||
return mg
|
||||
}
|
||||
|
||||
func getFailedItems(seq *healSequence) (m []Metric) {
|
||||
@ -1283,11 +1284,9 @@ func getObjectsScanned(seq *healSequence) (m []Metric) {
|
||||
return
|
||||
}
|
||||
|
||||
func getCacheMetrics() MetricsGroup {
|
||||
return MetricsGroup{
|
||||
id: "CacheMetrics",
|
||||
cachedRead: cachedRead,
|
||||
read: func(ctx context.Context) (metrics []Metric) {
|
||||
func getCacheMetrics() *MetricsGroup {
|
||||
mg := &MetricsGroup{}
|
||||
mg.RegisterRead(func(ctx context.Context) (metrics []Metric) {
|
||||
metrics = make([]Metric, 0, 20)
|
||||
cacheObjLayer := newCachedObjectLayerFn()
|
||||
// Service not initialized yet
|
||||
@ -1329,15 +1328,13 @@ func getCacheMetrics() MetricsGroup {
|
||||
})
|
||||
}
|
||||
return
|
||||
},
|
||||
}
|
||||
})
|
||||
return mg
|
||||
}
|
||||
|
||||
func getHTTPMetrics() MetricsGroup {
|
||||
return MetricsGroup{
|
||||
id: "httpMetrics",
|
||||
cachedRead: cachedRead,
|
||||
read: func(ctx context.Context) (metrics []Metric) {
|
||||
func getHTTPMetrics() *MetricsGroup {
|
||||
mg := &MetricsGroup{}
|
||||
mg.RegisterRead(func(ctx context.Context) (metrics []Metric) {
|
||||
httpStats := globalHTTPStats.toServerHTTPStats()
|
||||
metrics = make([]Metric, 0, 3+
|
||||
len(httpStats.CurrentS3Requests.APIStats)+
|
||||
@ -1392,15 +1389,13 @@ func getHTTPMetrics() MetricsGroup {
|
||||
})
|
||||
}
|
||||
return
|
||||
},
|
||||
}
|
||||
})
|
||||
return mg
|
||||
}
|
||||
|
||||
func getNetworkMetrics() MetricsGroup {
|
||||
return MetricsGroup{
|
||||
id: "networkMetrics",
|
||||
cachedRead: cachedRead,
|
||||
read: func(ctx context.Context) (metrics []Metric) {
|
||||
func getNetworkMetrics() *MetricsGroup {
|
||||
mg := &MetricsGroup{}
|
||||
mg.RegisterRead(func(ctx context.Context) (metrics []Metric) {
|
||||
metrics = make([]Metric, 0, 10)
|
||||
metrics = append(metrics, Metric{
|
||||
Description: getInternodeFailedRequests(),
|
||||
@ -1424,15 +1419,13 @@ func getNetworkMetrics() MetricsGroup {
|
||||
Value: float64(connStats.S3InputBytes),
|
||||
})
|
||||
return
|
||||
},
|
||||
}
|
||||
})
|
||||
return mg
|
||||
}
|
||||
|
||||
func getBucketUsageMetrics() MetricsGroup {
|
||||
return MetricsGroup{
|
||||
id: "BucketUsageMetrics",
|
||||
cachedRead: cachedRead,
|
||||
read: func(ctx context.Context) (metrics []Metric) {
|
||||
func getBucketUsageMetrics() *MetricsGroup {
|
||||
mg := &MetricsGroup{}
|
||||
mg.RegisterRead(func(ctx context.Context) (metrics []Metric) {
|
||||
objLayer := newObjectLayerFn()
|
||||
// Service not initialized yet
|
||||
if objLayer == nil || globalIsGateway {
|
||||
@ -1512,14 +1505,13 @@ func getBucketUsageMetrics() MetricsGroup {
|
||||
|
||||
}
|
||||
return
|
||||
},
|
||||
})
|
||||
return mg
|
||||
}
|
||||
}
|
||||
func getLocalStorageMetrics() MetricsGroup {
|
||||
return MetricsGroup{
|
||||
id: "localStorageMetrics",
|
||||
cachedRead: cachedRead,
|
||||
read: func(ctx context.Context) (metrics []Metric) {
|
||||
|
||||
func getLocalStorageMetrics() *MetricsGroup {
|
||||
mg := &MetricsGroup{}
|
||||
mg.RegisterRead(func(ctx context.Context) (metrics []Metric) {
|
||||
objLayer := newObjectLayerFn()
|
||||
// Service not initialized yet
|
||||
if objLayer == nil || globalIsGateway {
|
||||
@ -1554,14 +1546,13 @@ func getLocalStorageMetrics() MetricsGroup {
|
||||
})
|
||||
}
|
||||
return
|
||||
},
|
||||
})
|
||||
return mg
|
||||
}
|
||||
}
|
||||
func getClusterStorageMetrics() MetricsGroup {
|
||||
return MetricsGroup{
|
||||
id: "ClusterStorageMetrics",
|
||||
cachedRead: cachedRead,
|
||||
read: func(ctx context.Context) (metrics []Metric) {
|
||||
|
||||
func getClusterStorageMetrics() *MetricsGroup {
|
||||
mg := &MetricsGroup{}
|
||||
mg.RegisterRead(func(ctx context.Context) (metrics []Metric) {
|
||||
objLayer := newObjectLayerFn()
|
||||
// Service not initialized yet
|
||||
if objLayer == nil || !globalIsErasure {
|
||||
@ -1609,17 +1600,19 @@ func getClusterStorageMetrics() MetricsGroup {
|
||||
Value: float64(totalDisks.Sum()),
|
||||
})
|
||||
return
|
||||
},
|
||||
}
|
||||
})
|
||||
return mg
|
||||
}
|
||||
|
||||
type minioClusterCollector struct {
|
||||
metricsGroups []*MetricsGroup
|
||||
desc *prometheus.Desc
|
||||
}
|
||||
|
||||
func newMinioClusterCollector() *minioClusterCollector {
|
||||
func newMinioClusterCollector(metricsGroups []*MetricsGroup) *minioClusterCollector {
|
||||
return &minioClusterCollector{
|
||||
desc: prometheus.NewDesc("minio_stats", "Statistics exposed by MinIO server", nil, nil),
|
||||
metricsGroups: metricsGroups,
|
||||
desc: prometheus.NewDesc("minio_stats", "Statistics exposed by MinIO server per cluster", nil, nil),
|
||||
}
|
||||
}
|
||||
|
||||
@ -1630,7 +1623,6 @@ func (c *minioClusterCollector) Describe(ch chan<- *prometheus.Desc) {
|
||||
|
||||
// Collect is called by the Prometheus registry when collecting metrics.
|
||||
func (c *minioClusterCollector) Collect(out chan<- prometheus.Metric) {
|
||||
|
||||
var wg sync.WaitGroup
|
||||
publish := func(in <-chan Metric) {
|
||||
defer wg.Done()
|
||||
@ -1679,7 +1671,7 @@ func (c *minioClusterCollector) Collect(out chan<- prometheus.Metric) {
|
||||
|
||||
// Call peer api to fetch metrics
|
||||
peerCh := globalNotificationSys.GetClusterMetrics(GlobalContext)
|
||||
selfCh := ReportMetrics(GlobalContext, GetAllGenerators)
|
||||
selfCh := ReportMetrics(GlobalContext, c.metricsGroups)
|
||||
wg.Add(2)
|
||||
go publish(peerCh)
|
||||
go publish(selfCh)
|
||||
@ -1687,11 +1679,11 @@ func (c *minioClusterCollector) Collect(out chan<- prometheus.Metric) {
|
||||
}
|
||||
|
||||
// ReportMetrics reports serialized metrics to the channel passed for the metrics generated.
|
||||
func ReportMetrics(ctx context.Context, generators func() []MetricsGenerator) <-chan Metric {
|
||||
func ReportMetrics(ctx context.Context, metricsGroups []*MetricsGroup) <-chan Metric {
|
||||
ch := make(chan Metric)
|
||||
go func() {
|
||||
defer close(ch)
|
||||
populateAndPublish(generators, func(m Metric) bool {
|
||||
populateAndPublish(metricsGroups, func(m Metric) bool {
|
||||
if m.VariableLabels == nil {
|
||||
m.VariableLabels = make(map[string]string)
|
||||
}
|
||||
@ -1709,24 +1701,24 @@ func ReportMetrics(ctx context.Context, generators func() []MetricsGenerator) <-
|
||||
return ch
|
||||
}
|
||||
|
||||
// minioCollectorV2 is the Custom Collector
|
||||
type minioCollectorV2 struct {
|
||||
generator func() []MetricsGenerator
|
||||
// minioNodeCollector is the Custom Collector
|
||||
type minioNodeCollector struct {
|
||||
metricsGroups []*MetricsGroup
|
||||
desc *prometheus.Desc
|
||||
}
|
||||
|
||||
// Describe sends the super-set of all possible descriptors of metrics
|
||||
func (c *minioCollectorV2) Describe(ch chan<- *prometheus.Desc) {
|
||||
func (c *minioNodeCollector) Describe(ch chan<- *prometheus.Desc) {
|
||||
ch <- c.desc
|
||||
}
|
||||
|
||||
// populateAndPublish populates and then publishes the metrics generated by the generator function.
|
||||
func populateAndPublish(generatorFn func() []MetricsGenerator, publish func(m Metric) bool) {
|
||||
generators := generatorFn()
|
||||
for _, g := range generators {
|
||||
metricsGroup := g()
|
||||
metrics := metricsGroup.cachedRead(GlobalContext, &metricsGroup)
|
||||
for _, metric := range metrics {
|
||||
func populateAndPublish(metricsGroups []*MetricsGroup, publish func(m Metric) bool) {
|
||||
for _, mg := range metricsGroups {
|
||||
if mg == nil {
|
||||
continue
|
||||
}
|
||||
for _, metric := range mg.Get() {
|
||||
if !publish(metric) {
|
||||
return
|
||||
}
|
||||
@ -1735,12 +1727,12 @@ func populateAndPublish(generatorFn func() []MetricsGenerator, publish func(m Me
|
||||
}
|
||||
|
||||
// Collect is called by the Prometheus registry when collecting metrics.
|
||||
func (c *minioCollectorV2) Collect(ch chan<- prometheus.Metric) {
|
||||
func (c *minioNodeCollector) Collect(ch chan<- prometheus.Metric) {
|
||||
|
||||
// Expose MinIO's version information
|
||||
minioVersionInfo.WithLabelValues(Version, CommitID).Set(1.0)
|
||||
|
||||
populateAndPublish(c.generator, func(metric Metric) bool {
|
||||
populateAndPublish(c.metricsGroups, func(metric Metric) bool {
|
||||
labels, values := getOrderedLabelValueArrays(metric.VariableLabels)
|
||||
values = append(values, globalLocalNodeName)
|
||||
labels = append(labels, serverName)
|
||||
@ -1799,30 +1791,31 @@ func getOrderedLabelValueArrays(labelsWithValue map[string]string) (labels, valu
|
||||
return
|
||||
}
|
||||
|
||||
// newMinioCollectorV2 describes the collector
|
||||
// newMinioCollectorNode describes the collector
|
||||
// and returns reference of minioCollector for version 2
|
||||
// It creates the Prometheus Description which is used
|
||||
// to define Metric and help string
|
||||
func newMinioCollectorV2(generator func() []MetricsGenerator) *minioCollectorV2 {
|
||||
return &minioCollectorV2{
|
||||
generator: generator,
|
||||
desc: prometheus.NewDesc("minio_stats", "Statistics exposed by MinIO server", nil, nil),
|
||||
func newMinioCollectorNode(metricsGroups []*MetricsGroup) *minioNodeCollector {
|
||||
return &minioNodeCollector{
|
||||
metricsGroups: metricsGroups,
|
||||
desc: prometheus.NewDesc("minio_stats", "Statistics exposed by MinIO server per node", nil, nil),
|
||||
}
|
||||
}
|
||||
|
||||
func metricsServerHandler() http.Handler {
|
||||
|
||||
registry := prometheus.NewRegistry()
|
||||
|
||||
// Report all other metrics
|
||||
err := registry.Register(newMinioClusterCollector())
|
||||
err := registry.Register(clusterCollector)
|
||||
if err != nil {
|
||||
logger.CriticalIf(GlobalContext, err)
|
||||
}
|
||||
|
||||
// DefaultGatherers include golang metrics and process metrics.
|
||||
gatherers := prometheus.Gatherers{
|
||||
registry,
|
||||
}
|
||||
|
||||
// Delegate http serving to Prometheus client library, which will call collector.Collect.
|
||||
return promhttp.InstrumentMetricHandler(
|
||||
registry,
|
||||
@ -1836,7 +1829,7 @@ func metricsServerHandler() http.Handler {
|
||||
func metricsNodeHandler() http.Handler {
|
||||
registry := prometheus.NewRegistry()
|
||||
|
||||
err := registry.Register(newMinioCollectorV2(GetSingleNodeGenerators))
|
||||
err := registry.Register(nodeCollector)
|
||||
if err != nil {
|
||||
logger.CriticalIf(GlobalContext, err)
|
||||
}
|
||||
|
@ -1113,7 +1113,7 @@ func (s *peerRESTServer) GetPeerMetrics(w http.ResponseWriter, r *http.Request)
|
||||
|
||||
enc := gob.NewEncoder(w)
|
||||
|
||||
ch := ReportMetrics(r.Context(), GetGeneratorsForPeer)
|
||||
ch := ReportMetrics(r.Context(), peerMetricsGroups)
|
||||
for m := range ch {
|
||||
if err := enc.Encode(m); err != nil {
|
||||
s.writeErrorResponse(w, errors.New("Encoding metric failed: "+err.Error()))
|
||||
|
@ -29,6 +29,7 @@ import (
|
||||
"reflect"
|
||||
"strings"
|
||||
"testing"
|
||||
"time"
|
||||
)
|
||||
|
||||
// Tests maximum object size.
|
||||
@ -486,3 +487,32 @@ func TestGetMinioMode(t *testing.T) {
|
||||
testMinioMode(globalMinioModeGatewayPrefix + globalGatewayName)
|
||||
|
||||
}
|
||||
|
||||
func TestTimedValue(t *testing.T) {
|
||||
var cache timedValue
|
||||
t.Parallel()
|
||||
cache.Once.Do(func() {
|
||||
cache.TTL = 2 * time.Second
|
||||
cache.Update = func() (interface{}, error) {
|
||||
return time.Now(), nil
|
||||
}
|
||||
})
|
||||
|
||||
i, _ := cache.Get()
|
||||
t1 := i.(time.Time)
|
||||
|
||||
j, _ := cache.Get()
|
||||
t2 := j.(time.Time)
|
||||
|
||||
if !t1.Equal(t2) {
|
||||
t.Fatalf("expected time to be equal: %s != %s", t1, t2)
|
||||
}
|
||||
|
||||
time.Sleep(3 * time.Second)
|
||||
k, _ := cache.Get()
|
||||
t3 := k.(time.Time)
|
||||
|
||||
if t1.Equal(t3) {
|
||||
t.Fatalf("expected time to be un-equal: %s == %s", t1, t3)
|
||||
}
|
||||
}
|
||||
|
Loading…
Reference in New Issue
Block a user