mirror of
https://github.com/minio/minio.git
synced 2025-01-11 15:03:22 -05:00
fix: rename crawler as scanner in config (#11549)
This commit is contained in:
parent
11b2220696
commit
ffea6fcf09
@ -50,10 +50,14 @@ import (
|
|||||||
var serverDebugLog = env.Get("_MINIO_SERVER_DEBUG", config.EnableOff) == config.EnableOn
|
var serverDebugLog = env.Get("_MINIO_SERVER_DEBUG", config.EnableOff) == config.EnableOn
|
||||||
|
|
||||||
func init() {
|
func init() {
|
||||||
|
rand.Seed(time.Now().UTC().UnixNano())
|
||||||
|
|
||||||
logger.Init(GOPATH, GOROOT)
|
logger.Init(GOPATH, GOROOT)
|
||||||
logger.RegisterError(config.FmtError)
|
logger.RegisterError(config.FmtError)
|
||||||
|
|
||||||
rand.Seed(time.Now().UTC().UnixNano())
|
// Inject into config package.
|
||||||
|
config.Logger.Info = logger.Info
|
||||||
|
config.Logger.LogIf = logger.LogIf
|
||||||
|
|
||||||
globalDNSCache = xhttp.NewDNSCache(10*time.Second, 10*time.Second, logger.LogOnceIf)
|
globalDNSCache = xhttp.NewDNSCache(10*time.Second, 10*time.Second, logger.LogOnceIf)
|
||||||
|
|
||||||
|
@ -27,7 +27,6 @@ import (
|
|||||||
"github.com/minio/minio/cmd/config/api"
|
"github.com/minio/minio/cmd/config/api"
|
||||||
"github.com/minio/minio/cmd/config/cache"
|
"github.com/minio/minio/cmd/config/cache"
|
||||||
"github.com/minio/minio/cmd/config/compress"
|
"github.com/minio/minio/cmd/config/compress"
|
||||||
"github.com/minio/minio/cmd/config/crawler"
|
|
||||||
"github.com/minio/minio/cmd/config/dns"
|
"github.com/minio/minio/cmd/config/dns"
|
||||||
"github.com/minio/minio/cmd/config/etcd"
|
"github.com/minio/minio/cmd/config/etcd"
|
||||||
"github.com/minio/minio/cmd/config/heal"
|
"github.com/minio/minio/cmd/config/heal"
|
||||||
@ -35,6 +34,7 @@ import (
|
|||||||
"github.com/minio/minio/cmd/config/identity/openid"
|
"github.com/minio/minio/cmd/config/identity/openid"
|
||||||
"github.com/minio/minio/cmd/config/notify"
|
"github.com/minio/minio/cmd/config/notify"
|
||||||
"github.com/minio/minio/cmd/config/policy/opa"
|
"github.com/minio/minio/cmd/config/policy/opa"
|
||||||
|
"github.com/minio/minio/cmd/config/scanner"
|
||||||
"github.com/minio/minio/cmd/config/storageclass"
|
"github.com/minio/minio/cmd/config/storageclass"
|
||||||
"github.com/minio/minio/cmd/crypto"
|
"github.com/minio/minio/cmd/crypto"
|
||||||
xhttp "github.com/minio/minio/cmd/http"
|
xhttp "github.com/minio/minio/cmd/http"
|
||||||
@ -60,7 +60,7 @@ func initHelp() {
|
|||||||
config.LoggerWebhookSubSys: logger.DefaultKVS,
|
config.LoggerWebhookSubSys: logger.DefaultKVS,
|
||||||
config.AuditWebhookSubSys: logger.DefaultAuditKVS,
|
config.AuditWebhookSubSys: logger.DefaultAuditKVS,
|
||||||
config.HealSubSys: heal.DefaultKVS,
|
config.HealSubSys: heal.DefaultKVS,
|
||||||
config.CrawlerSubSys: crawler.DefaultKVS,
|
config.ScannerSubSys: scanner.DefaultKVS,
|
||||||
}
|
}
|
||||||
for k, v := range notify.DefaultNotificationKVS {
|
for k, v := range notify.DefaultNotificationKVS {
|
||||||
kvs[k] = v
|
kvs[k] = v
|
||||||
@ -117,8 +117,8 @@ func initHelp() {
|
|||||||
Description: "manage object healing frequency and bitrot verification checks",
|
Description: "manage object healing frequency and bitrot verification checks",
|
||||||
},
|
},
|
||||||
config.HelpKV{
|
config.HelpKV{
|
||||||
Key: config.CrawlerSubSys,
|
Key: config.ScannerSubSys,
|
||||||
Description: "manage crawling for usage calculation, lifecycle, healing and more",
|
Description: "manage scanner for usage calculation, lifecycle, healing and more",
|
||||||
},
|
},
|
||||||
config.HelpKV{
|
config.HelpKV{
|
||||||
Key: config.LoggerWebhookSubSys,
|
Key: config.LoggerWebhookSubSys,
|
||||||
@ -200,7 +200,7 @@ func initHelp() {
|
|||||||
config.CacheSubSys: cache.Help,
|
config.CacheSubSys: cache.Help,
|
||||||
config.CompressionSubSys: compress.Help,
|
config.CompressionSubSys: compress.Help,
|
||||||
config.HealSubSys: heal.Help,
|
config.HealSubSys: heal.Help,
|
||||||
config.CrawlerSubSys: crawler.Help,
|
config.ScannerSubSys: scanner.Help,
|
||||||
config.IdentityOpenIDSubSys: openid.Help,
|
config.IdentityOpenIDSubSys: openid.Help,
|
||||||
config.IdentityLDAPSubSys: xldap.Help,
|
config.IdentityLDAPSubSys: xldap.Help,
|
||||||
config.PolicyOPASubSys: opa.Help,
|
config.PolicyOPASubSys: opa.Help,
|
||||||
@ -274,11 +274,11 @@ func validateConfig(s config.Config, setDriveCounts []int) error {
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
if _, err := heal.LookupConfig(s[config.HealSubSys][config.Default]); err != nil {
|
if _, err = heal.LookupConfig(s[config.HealSubSys][config.Default]); err != nil {
|
||||||
return err
|
return err
|
||||||
}
|
}
|
||||||
|
|
||||||
if _, err := crawler.LookupConfig(s[config.CrawlerSubSys][config.Default]); err != nil {
|
if _, err = scanner.LookupConfig(s[config.ScannerSubSys][config.Default]); err != nil {
|
||||||
return err
|
return err
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -606,10 +606,10 @@ func applyDynamicConfig(ctx context.Context, objAPI ObjectLayer, s config.Config
|
|||||||
return fmt.Errorf("Unable to apply heal config: %w", err)
|
return fmt.Errorf("Unable to apply heal config: %w", err)
|
||||||
}
|
}
|
||||||
|
|
||||||
// Crawler
|
// Scanner
|
||||||
crawlerCfg, err := crawler.LookupConfig(s[config.CrawlerSubSys][config.Default])
|
scannerCfg, err := scanner.LookupConfig(s[config.ScannerSubSys][config.Default])
|
||||||
if err != nil {
|
if err != nil {
|
||||||
return fmt.Errorf("Unable to apply crawler config: %w", err)
|
return fmt.Errorf("Unable to apply scanner config: %w", err)
|
||||||
}
|
}
|
||||||
|
|
||||||
// Apply configurations.
|
// Apply configurations.
|
||||||
@ -624,7 +624,7 @@ func applyDynamicConfig(ctx context.Context, objAPI ObjectLayer, s config.Config
|
|||||||
globalHealConfig = healCfg
|
globalHealConfig = healCfg
|
||||||
globalHealConfigMu.Unlock()
|
globalHealConfigMu.Unlock()
|
||||||
|
|
||||||
logger.LogIf(ctx, crawlerSleeper.Update(crawlerCfg.Delay, crawlerCfg.MaxWait))
|
logger.LogIf(ctx, scannerSleeper.Update(scannerCfg.Delay, scannerCfg.MaxWait))
|
||||||
|
|
||||||
// Update all dynamic config values in memory.
|
// Update all dynamic config values in memory.
|
||||||
globalServerConfigMu.Lock()
|
globalServerConfigMu.Lock()
|
||||||
|
@ -77,6 +77,7 @@ const (
|
|||||||
LoggerWebhookSubSys = "logger_webhook"
|
LoggerWebhookSubSys = "logger_webhook"
|
||||||
AuditWebhookSubSys = "audit_webhook"
|
AuditWebhookSubSys = "audit_webhook"
|
||||||
HealSubSys = "heal"
|
HealSubSys = "heal"
|
||||||
|
ScannerSubSys = "scanner"
|
||||||
CrawlerSubSys = "crawler"
|
CrawlerSubSys = "crawler"
|
||||||
|
|
||||||
// Add new constants here if you add new fields to config.
|
// Add new constants here if you add new fields to config.
|
||||||
@ -114,7 +115,7 @@ var SubSystems = set.CreateStringSet(
|
|||||||
PolicyOPASubSys,
|
PolicyOPASubSys,
|
||||||
IdentityLDAPSubSys,
|
IdentityLDAPSubSys,
|
||||||
IdentityOpenIDSubSys,
|
IdentityOpenIDSubSys,
|
||||||
CrawlerSubSys,
|
ScannerSubSys,
|
||||||
HealSubSys,
|
HealSubSys,
|
||||||
NotifyAMQPSubSys,
|
NotifyAMQPSubSys,
|
||||||
NotifyESSubSys,
|
NotifyESSubSys,
|
||||||
@ -132,7 +133,7 @@ var SubSystems = set.CreateStringSet(
|
|||||||
var SubSystemsDynamic = set.CreateStringSet(
|
var SubSystemsDynamic = set.CreateStringSet(
|
||||||
APISubSys,
|
APISubSys,
|
||||||
CompressionSubSys,
|
CompressionSubSys,
|
||||||
CrawlerSubSys,
|
ScannerSubSys,
|
||||||
HealSubSys,
|
HealSubSys,
|
||||||
)
|
)
|
||||||
|
|
||||||
@ -151,7 +152,7 @@ var SubSystemsSingleTargets = set.CreateStringSet([]string{
|
|||||||
IdentityLDAPSubSys,
|
IdentityLDAPSubSys,
|
||||||
IdentityOpenIDSubSys,
|
IdentityOpenIDSubSys,
|
||||||
HealSubSys,
|
HealSubSys,
|
||||||
CrawlerSubSys,
|
ScannerSubSys,
|
||||||
}...)
|
}...)
|
||||||
|
|
||||||
// Constant separators
|
// Constant separators
|
||||||
@ -462,6 +463,13 @@ func LookupWorm() (bool, error) {
|
|||||||
return ParseBool(env.Get(EnvWorm, EnableOff))
|
return ParseBool(env.Get(EnvWorm, EnableOff))
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// Carries all the renamed sub-systems from their
|
||||||
|
// previously known names
|
||||||
|
var renamedSubsys = map[string]string{
|
||||||
|
CrawlerSubSys: ScannerSubSys,
|
||||||
|
// Add future sub-system renames
|
||||||
|
}
|
||||||
|
|
||||||
// Merge - merges a new config with all the
|
// Merge - merges a new config with all the
|
||||||
// missing values for default configs,
|
// missing values for default configs,
|
||||||
// returns a config.
|
// returns a config.
|
||||||
@ -477,9 +485,21 @@ func (c Config) Merge() Config {
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
if _, ok := cp[subSys]; !ok {
|
if _, ok := cp[subSys]; !ok {
|
||||||
// A config subsystem was removed or server was downgraded.
|
rnSubSys, ok := renamedSubsys[subSys]
|
||||||
Logger.Info("config: ignoring unknown subsystem config %q\n", subSys)
|
if !ok {
|
||||||
continue
|
// A config subsystem was removed or server was downgraded.
|
||||||
|
Logger.Info("config: ignoring unknown subsystem config %q\n", subSys)
|
||||||
|
continue
|
||||||
|
}
|
||||||
|
// Copy over settings from previous sub-system
|
||||||
|
// to newly renamed sub-system
|
||||||
|
for _, kv := range cp[rnSubSys][Default] {
|
||||||
|
_, ok := c[subSys][tgt].Lookup(kv.Key)
|
||||||
|
if !ok {
|
||||||
|
ckvs.Set(kv.Key, kv.Value)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
subSys = rnSubSys
|
||||||
}
|
}
|
||||||
cp[subSys][tgt] = ckvs
|
cp[subSys][tgt] = ckvs
|
||||||
}
|
}
|
||||||
|
@ -14,7 +14,7 @@
|
|||||||
* limitations under the License.
|
* limitations under the License.
|
||||||
*/
|
*/
|
||||||
|
|
||||||
package crawler
|
package scanner
|
||||||
|
|
||||||
import (
|
import (
|
||||||
"strconv"
|
"strconv"
|
||||||
@ -29,8 +29,10 @@ const (
|
|||||||
Delay = "delay"
|
Delay = "delay"
|
||||||
MaxWait = "max_wait"
|
MaxWait = "max_wait"
|
||||||
|
|
||||||
EnvDelay = "MINIO_CRAWLER_DELAY"
|
EnvDelay = "MINIO_SCANNER_DELAY"
|
||||||
EnvMaxWait = "MINIO_CRAWLER_MAX_WAIT"
|
EnvDelayLegacy = "MINIO_CRAWLER_DELAY"
|
||||||
|
EnvMaxWait = "MINIO_SCANNER_MAX_WAIT"
|
||||||
|
EnvMaxWaitLegacy = "MINIO_CRAWLER_MAX_WAIT"
|
||||||
)
|
)
|
||||||
|
|
||||||
// Config represents the heal settings.
|
// Config represents the heal settings.
|
||||||
@ -58,7 +60,7 @@ var (
|
|||||||
Help = config.HelpKVS{
|
Help = config.HelpKVS{
|
||||||
config.HelpKV{
|
config.HelpKV{
|
||||||
Key: Delay,
|
Key: Delay,
|
||||||
Description: `crawler delay multiplier, defaults to '10.0'`,
|
Description: `scanner delay multiplier, defaults to '10.0'`,
|
||||||
Optional: true,
|
Optional: true,
|
||||||
Type: "float",
|
Type: "float",
|
||||||
},
|
},
|
||||||
@ -73,14 +75,22 @@ var (
|
|||||||
|
|
||||||
// LookupConfig - lookup config and override with valid environment settings if any.
|
// LookupConfig - lookup config and override with valid environment settings if any.
|
||||||
func LookupConfig(kvs config.KVS) (cfg Config, err error) {
|
func LookupConfig(kvs config.KVS) (cfg Config, err error) {
|
||||||
if err = config.CheckValidKeys(config.CrawlerSubSys, kvs, DefaultKVS); err != nil {
|
if err = config.CheckValidKeys(config.ScannerSubSys, kvs, DefaultKVS); err != nil {
|
||||||
return cfg, err
|
return cfg, err
|
||||||
}
|
}
|
||||||
cfg.Delay, err = strconv.ParseFloat(env.Get(EnvDelay, kvs.Get(Delay)), 64)
|
delay := env.Get(EnvDelayLegacy, "")
|
||||||
|
if delay == "" {
|
||||||
|
delay = env.Get(EnvDelay, kvs.Get(Delay))
|
||||||
|
}
|
||||||
|
cfg.Delay, err = strconv.ParseFloat(delay, 64)
|
||||||
if err != nil {
|
if err != nil {
|
||||||
return cfg, err
|
return cfg, err
|
||||||
}
|
}
|
||||||
cfg.MaxWait, err = time.ParseDuration(env.Get(EnvMaxWait, kvs.Get(MaxWait)))
|
maxWait := env.Get(EnvMaxWaitLegacy, "")
|
||||||
|
if maxWait == "" {
|
||||||
|
maxWait = env.Get(EnvMaxWait, kvs.Get(MaxWait))
|
||||||
|
}
|
||||||
|
cfg.MaxWait, err = time.ParseDuration(maxWait)
|
||||||
if err != nil {
|
if err != nil {
|
||||||
return cfg, err
|
return cfg, err
|
||||||
}
|
}
|
@ -56,25 +56,25 @@ var (
|
|||||||
globalHealConfig heal.Config
|
globalHealConfig heal.Config
|
||||||
globalHealConfigMu sync.Mutex
|
globalHealConfigMu sync.Mutex
|
||||||
|
|
||||||
dataCrawlerLeaderLockTimeout = newDynamicTimeout(30*time.Second, 10*time.Second)
|
dataScannerLeaderLockTimeout = newDynamicTimeout(30*time.Second, 10*time.Second)
|
||||||
// Sleeper values are updated when config is loaded.
|
// Sleeper values are updated when config is loaded.
|
||||||
crawlerSleeper = newDynamicSleeper(10, 10*time.Second)
|
scannerSleeper = newDynamicSleeper(10, 10*time.Second)
|
||||||
)
|
)
|
||||||
|
|
||||||
// initDataCrawler will start the crawler in the background.
|
// initDataScanner will start the scanner in the background.
|
||||||
func initDataCrawler(ctx context.Context, objAPI ObjectLayer) {
|
func initDataScanner(ctx context.Context, objAPI ObjectLayer) {
|
||||||
go runDataCrawler(ctx, objAPI)
|
go runDataScanner(ctx, objAPI)
|
||||||
}
|
}
|
||||||
|
|
||||||
// runDataCrawler will start a data crawler.
|
// runDataScanner will start a data scanner.
|
||||||
// The function will block until the context is canceled.
|
// The function will block until the context is canceled.
|
||||||
// There should only ever be one crawler running per cluster.
|
// There should only ever be one scanner running per cluster.
|
||||||
func runDataCrawler(ctx context.Context, objAPI ObjectLayer) {
|
func runDataScanner(ctx context.Context, objAPI ObjectLayer) {
|
||||||
// Make sure only 1 crawler is running on the cluster.
|
// Make sure only 1 scanner is running on the cluster.
|
||||||
locker := objAPI.NewNSLock(minioMetaBucket, "runDataCrawler.lock")
|
locker := objAPI.NewNSLock(minioMetaBucket, "runDataScanner.lock")
|
||||||
r := rand.New(rand.NewSource(time.Now().UnixNano()))
|
r := rand.New(rand.NewSource(time.Now().UnixNano()))
|
||||||
for {
|
for {
|
||||||
err := locker.GetLock(ctx, dataCrawlerLeaderLockTimeout)
|
err := locker.GetLock(ctx, dataScannerLeaderLockTimeout)
|
||||||
if err != nil {
|
if err != nil {
|
||||||
time.Sleep(time.Duration(r.Float64() * float64(dataCrawlStartDelay)))
|
time.Sleep(time.Duration(r.Float64() * float64(dataCrawlStartDelay)))
|
||||||
continue
|
continue
|
||||||
@ -112,7 +112,7 @@ func runDataCrawler(ctx context.Context, objAPI ObjectLayer) {
|
|||||||
crawlTimer.Reset(dataCrawlStartDelay)
|
crawlTimer.Reset(dataCrawlStartDelay)
|
||||||
|
|
||||||
if intDataUpdateTracker.debug {
|
if intDataUpdateTracker.debug {
|
||||||
console.Debugln("starting crawler cycle")
|
console.Debugln("starting scanner cycle")
|
||||||
}
|
}
|
||||||
|
|
||||||
// Wait before starting next cycle and wait on startup.
|
// Wait before starting next cycle and wait on startup.
|
||||||
@ -167,7 +167,7 @@ type folderScanner struct {
|
|||||||
|
|
||||||
// crawlDataFolder will crawl the basepath+cache.Info.Name and return an updated cache.
|
// crawlDataFolder will crawl the basepath+cache.Info.Name and return an updated cache.
|
||||||
// The returned cache will always be valid, but may not be updated from the existing.
|
// The returned cache will always be valid, but may not be updated from the existing.
|
||||||
// Before each operation sleepDuration is called which can be used to temporarily halt the crawler.
|
// Before each operation sleepDuration is called which can be used to temporarily halt the scanner.
|
||||||
// If the supplied context is canceled the function will return at the first chance.
|
// If the supplied context is canceled the function will return at the first chance.
|
||||||
func crawlDataFolder(ctx context.Context, basePath string, cache dataUsageCache, getSize getSizeFn) (dataUsageCache, error) {
|
func crawlDataFolder(ctx context.Context, basePath string, cache dataUsageCache, getSize getSizeFn) (dataUsageCache, error) {
|
||||||
t := UTCNow()
|
t := UTCNow()
|
||||||
@ -390,12 +390,12 @@ func (f *folderScanner) scanQueuedLevels(ctx context.Context, folders []cachedFo
|
|||||||
if f.dataUsageCrawlDebug {
|
if f.dataUsageCrawlDebug {
|
||||||
console.Debugf(scannerLogPrefix+" Adding non-updated folder to heal check: %v\n", folder.name)
|
console.Debugf(scannerLogPrefix+" Adding non-updated folder to heal check: %v\n", folder.name)
|
||||||
}
|
}
|
||||||
// If probability was already crawlerHealFolderInclude, keep it.
|
// If probability was already scannerHealFolderInclude, keep it.
|
||||||
folder.objectHealProbDiv = f.healFolderInclude
|
folder.objectHealProbDiv = f.healFolderInclude
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
crawlerSleeper.Sleep(ctx, dataCrawlSleepPerFolder)
|
scannerSleeper.Sleep(ctx, dataCrawlSleepPerFolder)
|
||||||
|
|
||||||
cache := dataUsageEntry{}
|
cache := dataUsageEntry{}
|
||||||
|
|
||||||
@ -447,7 +447,7 @@ func (f *folderScanner) scanQueuedLevels(ctx context.Context, folders []cachedFo
|
|||||||
}
|
}
|
||||||
|
|
||||||
// Dynamic time delay.
|
// Dynamic time delay.
|
||||||
wait := crawlerSleeper.Timer(ctx)
|
wait := scannerSleeper.Timer(ctx)
|
||||||
|
|
||||||
// Get file size, ignore errors.
|
// Get file size, ignore errors.
|
||||||
item := crawlItem{
|
item := crawlItem{
|
||||||
@ -537,7 +537,7 @@ func (f *folderScanner) scanQueuedLevels(ctx context.Context, folders []cachedFo
|
|||||||
}
|
}
|
||||||
|
|
||||||
// Dynamic time delay.
|
// Dynamic time delay.
|
||||||
wait := crawlerSleeper.Timer(ctx)
|
wait := scannerSleeper.Timer(ctx)
|
||||||
resolver.bucket = bucket
|
resolver.bucket = bucket
|
||||||
|
|
||||||
foundObjs := false
|
foundObjs := false
|
||||||
@ -567,7 +567,7 @@ func (f *folderScanner) scanQueuedLevels(ctx context.Context, folders []cachedFo
|
|||||||
|
|
||||||
// Sleep and reset.
|
// Sleep and reset.
|
||||||
wait()
|
wait()
|
||||||
wait = crawlerSleeper.Timer(ctx)
|
wait = scannerSleeper.Timer(ctx)
|
||||||
entry, ok := entries.resolve(&resolver)
|
entry, ok := entries.resolve(&resolver)
|
||||||
if !ok {
|
if !ok {
|
||||||
for _, err := range errs {
|
for _, err := range errs {
|
||||||
@ -604,7 +604,7 @@ func (f *folderScanner) scanQueuedLevels(ctx context.Context, folders []cachedFo
|
|||||||
for _, ver := range fiv.Versions {
|
for _, ver := range fiv.Versions {
|
||||||
// Sleep and reset.
|
// Sleep and reset.
|
||||||
wait()
|
wait()
|
||||||
wait = crawlerSleeper.Timer(ctx)
|
wait = scannerSleeper.Timer(ctx)
|
||||||
err := bgSeq.queueHealTask(healSource{
|
err := bgSeq.queueHealTask(healSource{
|
||||||
bucket: bucket,
|
bucket: bucket,
|
||||||
object: fiv.Name,
|
object: fiv.Name,
|
||||||
@ -640,9 +640,9 @@ func (f *folderScanner) scanQueuedLevels(ctx context.Context, folders []cachedFo
|
|||||||
Remove: true,
|
Remove: true,
|
||||||
},
|
},
|
||||||
func(bucket, object, versionID string) error {
|
func(bucket, object, versionID string) error {
|
||||||
// Wait for each heal as per crawler frequency.
|
// Wait for each heal as per scanner frequency.
|
||||||
wait()
|
wait()
|
||||||
wait = crawlerSleeper.Timer(ctx)
|
wait = scannerSleeper.Timer(ctx)
|
||||||
return bgSeq.queueHealTask(healSource{
|
return bgSeq.queueHealTask(healSource{
|
||||||
bucket: bucket,
|
bucket: bucket,
|
||||||
object: object,
|
object: object,
|
||||||
@ -690,12 +690,12 @@ func (f *folderScanner) deepScanFolder(ctx context.Context, folder cachedFolder,
|
|||||||
dirStack = append(dirStack, entName)
|
dirStack = append(dirStack, entName)
|
||||||
err := readDirFn(path.Join(dirStack...), addDir)
|
err := readDirFn(path.Join(dirStack...), addDir)
|
||||||
dirStack = dirStack[:len(dirStack)-1]
|
dirStack = dirStack[:len(dirStack)-1]
|
||||||
crawlerSleeper.Sleep(ctx, dataCrawlSleepPerFolder)
|
scannerSleeper.Sleep(ctx, dataCrawlSleepPerFolder)
|
||||||
return err
|
return err
|
||||||
}
|
}
|
||||||
|
|
||||||
// Dynamic time delay.
|
// Dynamic time delay.
|
||||||
wait := crawlerSleeper.Timer(ctx)
|
wait := scannerSleeper.Timer(ctx)
|
||||||
|
|
||||||
// Get file size, ignore errors.
|
// Get file size, ignore errors.
|
||||||
dirStack = append(dirStack, entName)
|
dirStack = append(dirStack, entName)
|
@ -91,7 +91,7 @@ type dataUsageCacheInfo struct {
|
|||||||
Name string
|
Name string
|
||||||
LastUpdate time.Time
|
LastUpdate time.Time
|
||||||
NextCycle uint32
|
NextCycle uint32
|
||||||
// indicates if the disk is being healed and crawler
|
// indicates if the disk is being healed and scanner
|
||||||
// should skip healing the disk
|
// should skip healing the disk
|
||||||
SkipHealing bool
|
SkipHealing bool
|
||||||
BloomFilter []byte `msg:"BloomFilter,omitempty"`
|
BloomFilter []byte `msg:"BloomFilter,omitempty"`
|
||||||
|
@ -401,7 +401,7 @@ func (z *erasureServerPools) CrawlAndGetDataUsage(ctx context.Context, bf *bloom
|
|||||||
mu.Unlock()
|
mu.Unlock()
|
||||||
}
|
}
|
||||||
}()
|
}()
|
||||||
// Start crawler. Blocks until done.
|
// Start scanner. Blocks until done.
|
||||||
err := erObj.crawlAndGetDataUsage(ctx, allBuckets, bf, updates)
|
err := erObj.crawlAndGetDataUsage(ctx, allBuckets, bf, updates)
|
||||||
if err != nil {
|
if err != nil {
|
||||||
logger.LogIf(ctx, err)
|
logger.LogIf(ctx, err)
|
||||||
|
@ -260,7 +260,7 @@ func (er erasureObjects) getOnlineDisksWithHealing() (newDisks []StorageAPI, hea
|
|||||||
|
|
||||||
for i, info := range infos {
|
for i, info := range infos {
|
||||||
// Check if one of the drives in the set is being healed.
|
// Check if one of the drives in the set is being healed.
|
||||||
// this information is used by crawler to skip healing
|
// this information is used by scanner to skip healing
|
||||||
// this erasure set while it calculates the usage.
|
// this erasure set while it calculates the usage.
|
||||||
if info.Healing || info.Error != "" {
|
if info.Healing || info.Error != "" {
|
||||||
healing = true
|
healing = true
|
||||||
@ -378,7 +378,7 @@ func (er erasureObjects) crawlAndGetDataUsage(ctx context.Context, buckets []Buc
|
|||||||
}
|
}
|
||||||
}()
|
}()
|
||||||
|
|
||||||
// Start one crawler per disk
|
// Start one scanner per disk
|
||||||
var wg sync.WaitGroup
|
var wg sync.WaitGroup
|
||||||
wg.Add(len(disks))
|
wg.Add(len(disks))
|
||||||
for i := range disks {
|
for i := range disks {
|
||||||
|
@ -56,12 +56,6 @@ const (
|
|||||||
EnvAuditWebhookAuthToken = "MINIO_AUDIT_WEBHOOK_AUTH_TOKEN"
|
EnvAuditWebhookAuthToken = "MINIO_AUDIT_WEBHOOK_AUTH_TOKEN"
|
||||||
)
|
)
|
||||||
|
|
||||||
// Inject into config package.
|
|
||||||
func init() {
|
|
||||||
config.Logger.Info = Info
|
|
||||||
config.Logger.LogIf = LogIf
|
|
||||||
}
|
|
||||||
|
|
||||||
// Default KVS for loggerHTTP and loggerAuditHTTP
|
// Default KVS for loggerHTTP and loggerAuditHTTP
|
||||||
var (
|
var (
|
||||||
DefaultKVS = config.KVS{
|
DefaultKVS = config.KVS{
|
||||||
|
@ -145,7 +145,7 @@ func (m *metacache) worthKeeping(currentCycle uint64) bool {
|
|||||||
// Cycle is somehow bigger.
|
// Cycle is somehow bigger.
|
||||||
return false
|
return false
|
||||||
case cache.finished() && time.Since(cache.lastHandout) > 48*time.Hour:
|
case cache.finished() && time.Since(cache.lastHandout) > 48*time.Hour:
|
||||||
// Keep only for 2 days. Fallback if crawler is clogged.
|
// Keep only for 2 days. Fallback if scanner is clogged.
|
||||||
return false
|
return false
|
||||||
case cache.finished() && currentCycle >= dataUsageUpdateDirCycles && cache.startedCycle < currentCycle-dataUsageUpdateDirCycles:
|
case cache.finished() && currentCycle >= dataUsageUpdateDirCycles && cache.startedCycle < currentCycle-dataUsageUpdateDirCycles:
|
||||||
// Cycle is too old to be valuable.
|
// Cycle is too old to be valuable.
|
||||||
|
@ -419,7 +419,7 @@ func networkMetricsPrometheus(ch chan<- prometheus.Metric) {
|
|||||||
}
|
}
|
||||||
|
|
||||||
// Populates prometheus with bucket usage metrics, this metrics
|
// Populates prometheus with bucket usage metrics, this metrics
|
||||||
// is only enabled if crawler is enabled.
|
// is only enabled if scanner is enabled.
|
||||||
func bucketUsageMetricsPrometheus(ch chan<- prometheus.Metric) {
|
func bucketUsageMetricsPrometheus(ch chan<- prometheus.Metric) {
|
||||||
objLayer := newObjectLayerFn()
|
objLayer := newObjectLayerFn()
|
||||||
// Service not initialized yet
|
// Service not initialized yet
|
||||||
|
@ -509,7 +509,7 @@ func serverMain(ctx *cli.Context) {
|
|||||||
initBackgroundExpiry(GlobalContext, newObject)
|
initBackgroundExpiry(GlobalContext, newObject)
|
||||||
}
|
}
|
||||||
|
|
||||||
initDataCrawler(GlobalContext, newObject)
|
initDataScanner(GlobalContext, newObject)
|
||||||
|
|
||||||
if err = initServer(GlobalContext, newObject); err != nil {
|
if err = initServer(GlobalContext, newObject); err != nil {
|
||||||
var cerr config.Err
|
var cerr config.Err
|
||||||
|
@ -263,36 +263,36 @@ The following sub-systems are dynamic i.e., configuration parameters for each su
|
|||||||
```
|
```
|
||||||
api manage global HTTP API call specific features, such as throttling, authentication types, etc.
|
api manage global HTTP API call specific features, such as throttling, authentication types, etc.
|
||||||
heal manage object healing frequency and bitrot verification checks
|
heal manage object healing frequency and bitrot verification checks
|
||||||
crawler manage crawling for usage calculation, lifecycle, healing and more
|
scanner manage crawling for usage calculation, lifecycle, healing and more
|
||||||
```
|
```
|
||||||
|
|
||||||
> NOTE: if you set any of the following sub-system configuration using ENVs, dynamic behavior is not supported.
|
> NOTE: if you set any of the following sub-system configuration using ENVs, dynamic behavior is not supported.
|
||||||
|
|
||||||
### Usage crawler
|
### Usage scanner
|
||||||
|
|
||||||
Data usage crawler is enabled by default. The following configuration settings allow for more staggered delay in terms of usage calculation. The crawler adapts to the system speed and completely pauses when the system is under load. It is possible to adjust the speed of the crawler and thereby the latency of updates being reflected. The delays between each operation of the crawl can be adjusted by the `mc admin config set alias/ delay=15.0`. By default the value is `10.0`. This means the crawler will sleep *10x* the time each operation takes.
|
Data usage scanner is enabled by default. The following configuration settings allow for more staggered delay in terms of usage calculation. The scanner adapts to the system speed and completely pauses when the system is under load. It is possible to adjust the speed of the scanner and thereby the latency of updates being reflected. The delays between each operation of the crawl can be adjusted by the `mc admin config set alias/ delay=15.0`. By default the value is `10.0`. This means the scanner will sleep *10x* the time each operation takes.
|
||||||
|
|
||||||
In most setups this will keep the crawler slow enough to not impact overall system performance. Setting the `delay` key to a *lower* value will make the crawler faster and setting it to 0 will make the crawler run at full speed (not recommended in production). Setting it to a higher value will make the crawler slower, consuming less resources with the trade off of not collecting metrics for operations like healing and disk usage as fast.
|
In most setups this will keep the scanner slow enough to not impact overall system performance. Setting the `delay` key to a *lower* value will make the scanner faster and setting it to 0 will make the scanner run at full speed (not recommended in production). Setting it to a higher value will make the scanner slower, consuming less resources with the trade off of not collecting metrics for operations like healing and disk usage as fast.
|
||||||
|
|
||||||
```
|
```
|
||||||
~ mc admin config set alias/ crawler
|
~ mc admin config set alias/ scanner
|
||||||
KEY:
|
KEY:
|
||||||
crawler manage crawling for usage calculation, lifecycle, healing and more
|
scanner manage crawling for usage calculation, lifecycle, healing and more
|
||||||
|
|
||||||
ARGS:
|
ARGS:
|
||||||
delay (float) crawler delay multiplier, defaults to '10.0'
|
delay (float) scanner delay multiplier, defaults to '10.0'
|
||||||
max_wait (duration) maximum wait time between operations, defaults to '15s'
|
max_wait (duration) maximum wait time between operations, defaults to '15s'
|
||||||
```
|
```
|
||||||
|
|
||||||
Example: Following setting will decrease the crawler speed by a factor of 3, reducing the system resource use, but increasing the latency of updates being reflected.
|
Example: Following setting will decrease the scanner speed by a factor of 3, reducing the system resource use, but increasing the latency of updates being reflected.
|
||||||
|
|
||||||
```sh
|
```sh
|
||||||
~ mc admin config set alias/ crawler delay=30.0
|
~ mc admin config set alias/ scanner delay=30.0
|
||||||
```
|
```
|
||||||
|
|
||||||
Once set the crawler settings are automatically applied without the need for server restarts.
|
Once set the scanner settings are automatically applied without the need for server restarts.
|
||||||
|
|
||||||
> NOTE: Data usage crawler is not supported under Gateway deployments.
|
> NOTE: Data usage scanner is not supported under Gateway deployments.
|
||||||
|
|
||||||
### Healing
|
### Healing
|
||||||
|
|
||||||
|
Loading…
Reference in New Issue
Block a user