2023-07-08 10:42:05 -07:00
|
|
|
// Copyright (c) 2015-2022 MinIO, Inc.
|
|
|
|
//
|
|
|
|
// This file is part of MinIO Object Storage stack
|
|
|
|
//
|
|
|
|
// This program is free software: you can redistribute it and/or modify
|
|
|
|
// it under the terms of the GNU Affero General Public License as published by
|
|
|
|
// the Free Software Foundation, either version 3 of the License, or
|
|
|
|
// (at your option) any later version.
|
|
|
|
//
|
|
|
|
// This program is distributed in the hope that it will be useful
|
|
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
// GNU Affero General Public License for more details.
|
|
|
|
//
|
|
|
|
// You should have received a copy of the GNU Affero General Public License
|
|
|
|
// along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
|
2022-07-05 14:45:49 -07:00
|
|
|
package cmd
|
|
|
|
|
|
|
|
import (
|
|
|
|
"strings"
|
|
|
|
"sync"
|
|
|
|
"sync/atomic"
|
|
|
|
"time"
|
|
|
|
"unsafe"
|
|
|
|
|
2023-06-19 17:53:08 -07:00
|
|
|
"github.com/minio/madmin-go/v3"
|
2022-07-05 14:45:49 -07:00
|
|
|
"github.com/minio/minio/internal/bucket/lifecycle"
|
|
|
|
)
|
|
|
|
|
|
|
|
//go:generate stringer -type=scannerMetric -trimprefix=scannerMetric $GOFILE
|
|
|
|
|
|
|
|
type scannerMetric uint8
|
|
|
|
|
|
|
|
type scannerMetrics struct {
|
|
|
|
// All fields must be accessed atomically and aligned.
|
|
|
|
operations [scannerMetricLast]uint64
|
|
|
|
latency [scannerMetricLastRealtime]lockedLastMinuteLatency
|
|
|
|
|
|
|
|
// actions records actions performed.
|
|
|
|
actions [lifecycle.ActionCount]uint64
|
|
|
|
actionsLatency [lifecycle.ActionCount]lockedLastMinuteLatency
|
|
|
|
|
|
|
|
// currentPaths contains (string,*currentPathTracker) for each disk processing.
|
|
|
|
// Alignment not required.
|
|
|
|
currentPaths sync.Map
|
|
|
|
|
|
|
|
cycleInfoMu sync.Mutex
|
|
|
|
cycleInfo *currentScannerCycle
|
|
|
|
}
|
|
|
|
|
|
|
|
var globalScannerMetrics scannerMetrics
|
|
|
|
|
|
|
|
const (
|
|
|
|
// START Realtime metrics, that only to records
|
|
|
|
// last minute latencies and total operation count.
|
|
|
|
scannerMetricReadMetadata scannerMetric = iota
|
|
|
|
scannerMetricCheckMissing
|
|
|
|
scannerMetricSaveUsage
|
|
|
|
scannerMetricApplyAll
|
|
|
|
scannerMetricApplyVersion
|
|
|
|
scannerMetricTierObjSweep
|
|
|
|
scannerMetricHealCheck
|
|
|
|
scannerMetricILM
|
|
|
|
scannerMetricCheckReplication
|
|
|
|
scannerMetricYield
|
2022-11-28 19:20:55 +01:00
|
|
|
scannerMetricCleanAbandoned
|
|
|
|
scannerMetricApplyNonCurrent
|
2023-09-24 22:15:31 -07:00
|
|
|
scannerMetricHealAbandonedVersion
|
2022-07-05 14:45:49 -07:00
|
|
|
|
|
|
|
// START Trace metrics:
|
|
|
|
scannerMetricStartTrace
|
|
|
|
scannerMetricScanObject // Scan object. All operations included.
|
2023-09-24 22:15:31 -07:00
|
|
|
scannerMetricHealAbandonedObject
|
2022-07-05 14:45:49 -07:00
|
|
|
|
|
|
|
// END realtime metrics:
|
|
|
|
scannerMetricLastRealtime
|
|
|
|
|
|
|
|
// Trace only metrics:
|
2022-12-01 14:31:35 -08:00
|
|
|
scannerMetricScanFolder // Scan a folder on disk, recursively.
|
|
|
|
scannerMetricScanCycle // Full cycle, cluster global
|
|
|
|
scannerMetricScanBucketDrive // Single bucket on one drive
|
2022-12-05 20:18:50 +01:00
|
|
|
scannerMetricCompactFolder // Folder compacted.
|
2022-07-05 14:45:49 -07:00
|
|
|
|
|
|
|
// Must be last:
|
|
|
|
scannerMetricLast
|
|
|
|
)
|
|
|
|
|
|
|
|
// log scanner action.
|
|
|
|
// Use for s > scannerMetricStartTrace
|
2023-02-21 18:33:33 +01:00
|
|
|
func (p *scannerMetrics) log(s scannerMetric, paths ...string) func(custom map[string]string) {
|
2022-07-05 14:45:49 -07:00
|
|
|
startTime := time.Now()
|
2023-02-21 18:33:33 +01:00
|
|
|
return func(custom map[string]string) {
|
2022-07-05 14:45:49 -07:00
|
|
|
duration := time.Since(startTime)
|
|
|
|
|
|
|
|
atomic.AddUint64(&p.operations[s], 1)
|
|
|
|
if s < scannerMetricLastRealtime {
|
|
|
|
p.latency[s].add(duration)
|
|
|
|
}
|
|
|
|
|
|
|
|
if s > scannerMetricStartTrace && globalTrace.NumSubscribers(madmin.TraceScanner) > 0 {
|
2023-02-21 18:33:33 +01:00
|
|
|
globalTrace.Publish(scannerTrace(s, startTime, duration, strings.Join(paths, " "), custom))
|
2022-07-05 14:45:49 -07:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// time a scanner action.
|
|
|
|
// Use for s < scannerMetricLastRealtime
|
|
|
|
func (p *scannerMetrics) time(s scannerMetric) func() {
|
|
|
|
startTime := time.Now()
|
|
|
|
return func() {
|
|
|
|
duration := time.Since(startTime)
|
|
|
|
|
|
|
|
atomic.AddUint64(&p.operations[s], 1)
|
|
|
|
if s < scannerMetricLastRealtime {
|
|
|
|
p.latency[s].add(duration)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// timeSize add time and size of a scanner action.
|
|
|
|
// Use for s < scannerMetricLastRealtime
|
|
|
|
func (p *scannerMetrics) timeSize(s scannerMetric) func(sz int) {
|
|
|
|
startTime := time.Now()
|
|
|
|
return func(sz int) {
|
|
|
|
duration := time.Since(startTime)
|
|
|
|
|
|
|
|
atomic.AddUint64(&p.operations[s], 1)
|
|
|
|
if s < scannerMetricLastRealtime {
|
|
|
|
p.latency[s].addSize(duration, int64(sz))
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// incTime will increment time on metric s with a specific duration.
|
|
|
|
// Use for s < scannerMetricLastRealtime
|
|
|
|
func (p *scannerMetrics) incTime(s scannerMetric, d time.Duration) {
|
|
|
|
atomic.AddUint64(&p.operations[s], 1)
|
|
|
|
if s < scannerMetricLastRealtime {
|
|
|
|
p.latency[s].add(d)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// timeILM times an ILM action.
|
|
|
|
// lifecycle.NoneAction is ignored.
|
|
|
|
// Use for s < scannerMetricLastRealtime
|
2023-08-09 08:55:19 -07:00
|
|
|
func (p *scannerMetrics) timeILM(a lifecycle.Action) func(versions uint64) {
|
2022-07-05 14:45:49 -07:00
|
|
|
if a == lifecycle.NoneAction || a >= lifecycle.ActionCount {
|
2023-08-09 08:55:19 -07:00
|
|
|
return func(_ uint64) {}
|
2022-07-05 14:45:49 -07:00
|
|
|
}
|
|
|
|
startTime := time.Now()
|
2023-08-09 08:55:19 -07:00
|
|
|
return func(versions uint64) {
|
2022-07-05 14:45:49 -07:00
|
|
|
duration := time.Since(startTime)
|
2023-08-09 08:55:19 -07:00
|
|
|
atomic.AddUint64(&p.actions[a], versions)
|
2022-07-05 14:45:49 -07:00
|
|
|
p.actionsLatency[a].add(duration)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
type currentPathTracker struct {
|
|
|
|
name *unsafe.Pointer // contains atomically accessed *string
|
|
|
|
}
|
|
|
|
|
|
|
|
// currentPathUpdater provides a lightweight update function for keeping track of
|
|
|
|
// current objects for each disk.
|
|
|
|
// Returns a function that can be used to update the current object
|
|
|
|
// and a function to call to when processing finished.
|
|
|
|
func (p *scannerMetrics) currentPathUpdater(disk, initial string) (update func(path string), done func()) {
|
|
|
|
initialPtr := unsafe.Pointer(&initial)
|
|
|
|
tracker := ¤tPathTracker{
|
|
|
|
name: &initialPtr,
|
|
|
|
}
|
|
|
|
|
|
|
|
p.currentPaths.Store(disk, tracker)
|
|
|
|
return func(path string) {
|
|
|
|
atomic.StorePointer(tracker.name, unsafe.Pointer(&path))
|
|
|
|
}, func() {
|
|
|
|
p.currentPaths.Delete(disk)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// getCurrentPaths returns the paths currently being processed.
|
|
|
|
func (p *scannerMetrics) getCurrentPaths() []string {
|
|
|
|
var res []string
|
2022-07-06 07:48:38 -07:00
|
|
|
prefix := globalLocalNodeName + "/"
|
2022-07-05 14:45:49 -07:00
|
|
|
p.currentPaths.Range(func(key, value interface{}) bool {
|
|
|
|
// We are a bit paranoid, but better miss an entry than crash.
|
|
|
|
name, ok := key.(string)
|
|
|
|
if !ok {
|
|
|
|
return true
|
|
|
|
}
|
|
|
|
obj, ok := value.(*currentPathTracker)
|
|
|
|
if !ok {
|
|
|
|
return true
|
|
|
|
}
|
|
|
|
strptr := (*string)(atomic.LoadPointer(obj.name))
|
|
|
|
if strptr != nil {
|
2022-07-06 07:48:38 -07:00
|
|
|
res = append(res, pathJoin(prefix, name, *strptr))
|
2022-07-05 14:45:49 -07:00
|
|
|
}
|
|
|
|
return true
|
|
|
|
})
|
|
|
|
return res
|
|
|
|
}
|
|
|
|
|
2022-12-01 14:31:35 -08:00
|
|
|
// activeDrives returns the number of currently active disks.
|
2022-07-05 14:45:49 -07:00
|
|
|
// (since this is concurrent it may not be 100% reliable)
|
2022-12-01 14:31:35 -08:00
|
|
|
func (p *scannerMetrics) activeDrives() int {
|
2022-07-05 14:45:49 -07:00
|
|
|
var i int
|
|
|
|
p.currentPaths.Range(func(k, v interface{}) bool {
|
|
|
|
i++
|
|
|
|
return true
|
|
|
|
})
|
|
|
|
return i
|
|
|
|
}
|
|
|
|
|
|
|
|
// lifetime returns the lifetime count of the specified metric.
|
|
|
|
func (p *scannerMetrics) lifetime(m scannerMetric) uint64 {
|
2022-12-05 20:18:50 +01:00
|
|
|
if m >= scannerMetricLast {
|
2022-07-05 14:45:49 -07:00
|
|
|
return 0
|
|
|
|
}
|
|
|
|
val := atomic.LoadUint64(&p.operations[m])
|
|
|
|
return val
|
|
|
|
}
|
|
|
|
|
|
|
|
// lastMinute returns the last minute statistics of a metric.
|
|
|
|
// m should be < scannerMetricLastRealtime
|
|
|
|
func (p *scannerMetrics) lastMinute(m scannerMetric) AccElem {
|
2022-12-05 20:18:50 +01:00
|
|
|
if m >= scannerMetricLastRealtime {
|
2022-07-05 14:45:49 -07:00
|
|
|
return AccElem{}
|
|
|
|
}
|
|
|
|
val := p.latency[m].total()
|
|
|
|
return val
|
|
|
|
}
|
|
|
|
|
|
|
|
// lifetimeActions returns the lifetime count of the specified ilm metric.
|
|
|
|
func (p *scannerMetrics) lifetimeActions(a lifecycle.Action) uint64 {
|
|
|
|
if a == lifecycle.NoneAction || a >= lifecycle.ActionCount {
|
|
|
|
return 0
|
|
|
|
}
|
|
|
|
val := atomic.LoadUint64(&p.actions[a])
|
|
|
|
return val
|
|
|
|
}
|
|
|
|
|
|
|
|
// lastMinuteActions returns the last minute statistics of an ilm metric.
|
|
|
|
func (p *scannerMetrics) lastMinuteActions(a lifecycle.Action) AccElem {
|
|
|
|
if a == lifecycle.NoneAction || a >= lifecycle.ActionCount {
|
|
|
|
return AccElem{}
|
|
|
|
}
|
|
|
|
val := p.actionsLatency[a].total()
|
|
|
|
return val
|
|
|
|
}
|
|
|
|
|
|
|
|
// setCycle updates the current cycle metrics.
|
|
|
|
func (p *scannerMetrics) setCycle(c *currentScannerCycle) {
|
|
|
|
if c != nil {
|
|
|
|
c2 := c.clone()
|
|
|
|
c = &c2
|
|
|
|
}
|
|
|
|
p.cycleInfoMu.Lock()
|
|
|
|
p.cycleInfo = c
|
|
|
|
p.cycleInfoMu.Unlock()
|
|
|
|
}
|
|
|
|
|
|
|
|
// getCycle returns the current cycle metrics.
|
|
|
|
// If not nil, the returned value can safely be modified.
|
|
|
|
func (p *scannerMetrics) getCycle() *currentScannerCycle {
|
|
|
|
p.cycleInfoMu.Lock()
|
|
|
|
defer p.cycleInfoMu.Unlock()
|
|
|
|
if p.cycleInfo == nil {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
c := p.cycleInfo.clone()
|
|
|
|
return &c
|
|
|
|
}
|
|
|
|
|
|
|
|
func (p *scannerMetrics) report() madmin.ScannerMetrics {
|
|
|
|
var m madmin.ScannerMetrics
|
|
|
|
cycle := p.getCycle()
|
|
|
|
if cycle != nil {
|
|
|
|
m.CurrentCycle = cycle.current
|
|
|
|
m.CyclesCompletedAt = cycle.cycleCompleted
|
|
|
|
m.CurrentStarted = cycle.started
|
|
|
|
}
|
|
|
|
m.CollectedAt = time.Now()
|
|
|
|
m.ActivePaths = p.getCurrentPaths()
|
|
|
|
m.LifeTimeOps = make(map[string]uint64, scannerMetricLast)
|
|
|
|
for i := scannerMetric(0); i < scannerMetricLast; i++ {
|
|
|
|
if n := atomic.LoadUint64(&p.operations[i]); n > 0 {
|
|
|
|
m.LifeTimeOps[i.String()] = n
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if len(m.LifeTimeOps) == 0 {
|
|
|
|
m.LifeTimeOps = nil
|
|
|
|
}
|
|
|
|
|
|
|
|
m.LastMinute.Actions = make(map[string]madmin.TimedAction, scannerMetricLastRealtime)
|
|
|
|
for i := scannerMetric(0); i < scannerMetricLastRealtime; i++ {
|
|
|
|
lm := p.lastMinute(i)
|
|
|
|
if lm.N > 0 {
|
|
|
|
m.LastMinute.Actions[i.String()] = lm.asTimedAction()
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if len(m.LastMinute.Actions) == 0 {
|
|
|
|
m.LastMinute.Actions = nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// ILM
|
|
|
|
m.LifeTimeILM = make(map[string]uint64)
|
|
|
|
for i := lifecycle.NoneAction + 1; i < lifecycle.ActionCount; i++ {
|
|
|
|
if n := atomic.LoadUint64(&p.actions[i]); n > 0 {
|
|
|
|
m.LifeTimeILM[i.String()] = n
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if len(m.LifeTimeILM) == 0 {
|
|
|
|
m.LifeTimeILM = nil
|
|
|
|
}
|
|
|
|
|
|
|
|
if len(m.LifeTimeILM) > 0 {
|
|
|
|
m.LastMinute.ILM = make(map[string]madmin.TimedAction, len(m.LifeTimeILM))
|
|
|
|
for i := lifecycle.NoneAction + 1; i < lifecycle.ActionCount; i++ {
|
|
|
|
lm := p.lastMinuteActions(i)
|
|
|
|
if lm.N > 0 {
|
|
|
|
m.LastMinute.ILM[i.String()] = madmin.TimedAction{Count: uint64(lm.N), AccTime: uint64(lm.Total)}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if len(m.LastMinute.ILM) == 0 {
|
|
|
|
m.LastMinute.ILM = nil
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return m
|
|
|
|
}
|