2021-04-18 12:41:13 -07:00
|
|
|
// Copyright (c) 2015-2021 MinIO, Inc.
|
|
|
|
//
|
|
|
|
// This file is part of MinIO Object Storage stack
|
|
|
|
//
|
|
|
|
// This program is free software: you can redistribute it and/or modify
|
|
|
|
// it under the terms of the GNU Affero General Public License as published by
|
|
|
|
// the Free Software Foundation, either version 3 of the License, or
|
|
|
|
// (at your option) any later version.
|
|
|
|
//
|
|
|
|
// This program is distributed in the hope that it will be useful
|
|
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
// GNU Affero General Public License for more details.
|
|
|
|
//
|
|
|
|
// You should have received a copy of the GNU Affero General Public License
|
|
|
|
// along with this program. If not, see <http://www.gnu.org/licenses/>.
|
2017-08-14 18:08:42 -07:00
|
|
|
|
|
|
|
package cmd
|
|
|
|
|
|
|
|
import (
|
2018-04-05 15:04:40 -07:00
|
|
|
"context"
|
2020-08-03 18:17:48 -07:00
|
|
|
"errors"
|
2020-06-12 20:04:01 -07:00
|
|
|
"fmt"
|
2021-02-18 00:38:37 -08:00
|
|
|
"math/rand"
|
2021-02-26 09:52:27 -08:00
|
|
|
"os"
|
2022-08-08 16:16:44 -07:00
|
|
|
"runtime"
|
2020-06-12 20:04:01 -07:00
|
|
|
"sort"
|
2020-05-09 18:54:20 +02:00
|
|
|
"sync"
|
2020-06-12 20:04:01 -07:00
|
|
|
"time"
|
2017-08-14 18:08:42 -07:00
|
|
|
|
2023-06-19 17:53:08 -07:00
|
|
|
"github.com/minio/madmin-go/v3"
|
2021-06-01 14:59:40 -07:00
|
|
|
"github.com/minio/minio/internal/bpool"
|
|
|
|
"github.com/minio/minio/internal/dsync"
|
2023-08-14 12:28:13 -07:00
|
|
|
xioutil "github.com/minio/minio/internal/ioutil"
|
2021-06-01 14:59:40 -07:00
|
|
|
"github.com/minio/minio/internal/logger"
|
2023-04-26 11:27:40 +05:30
|
|
|
"github.com/minio/pkg/sync/errgroup"
|
2017-08-14 18:08:42 -07:00
|
|
|
)
|
|
|
|
|
2023-01-17 19:37:47 +05:30
|
|
|
// list all errors that can be ignore in a bucket operation.
|
|
|
|
var bucketOpIgnoredErrs = append(baseIgnoredErrs, errDiskAccessDenied, errUnformattedDisk)
|
|
|
|
|
|
|
|
// list all errors that can be ignored in a bucket metadata operation.
|
|
|
|
var bucketMetadataOpIgnoredErrs = append(bucketOpIgnoredErrs, errVolumeNotFound)
|
|
|
|
|
2020-06-12 20:04:01 -07:00
|
|
|
// OfflineDisk represents an unavailable disk.
|
|
|
|
var OfflineDisk StorageAPI // zero value is nil
|
|
|
|
|
|
|
|
// erasureObjects - Implements ER object layer.
|
|
|
|
type erasureObjects struct {
|
2021-01-16 12:08:02 -08:00
|
|
|
setDriveCount int
|
|
|
|
defaultParityCount int
|
2020-12-07 10:04:07 -08:00
|
|
|
|
2021-03-04 14:36:23 -08:00
|
|
|
setIndex int
|
|
|
|
poolIndex int
|
2021-01-26 22:21:51 +01:00
|
|
|
|
2020-06-12 20:04:01 -07:00
|
|
|
// getDisks returns list of storageAPIs.
|
|
|
|
getDisks func() []StorageAPI
|
|
|
|
|
|
|
|
// getLockers returns list of remote and local lockers.
|
2020-09-25 19:21:52 -07:00
|
|
|
getLockers func() ([]dsync.NetLocker, string)
|
2020-06-12 20:04:01 -07:00
|
|
|
|
|
|
|
// getEndpoints returns list of endpoint strings belonging this set.
|
|
|
|
// some may be local and some remote.
|
2021-09-29 19:36:19 +01:00
|
|
|
getEndpoints func() []Endpoint
|
2020-06-12 20:04:01 -07:00
|
|
|
|
|
|
|
// Locker mutex map.
|
|
|
|
nsMutex *nsLockMap
|
|
|
|
|
|
|
|
// Byte pools used for temporary i/o buffers.
|
|
|
|
bp *bpool.BytePoolCap
|
|
|
|
|
2021-06-07 10:06:06 -07:00
|
|
|
// Byte pools used for temporary i/o buffers,
|
|
|
|
// legacy objects.
|
|
|
|
bpOld *bpool.BytePoolCap
|
2017-08-14 18:08:42 -07:00
|
|
|
}
|
|
|
|
|
2020-06-12 20:04:01 -07:00
|
|
|
// NewNSLock - initialize a new namespace RWLocker instance.
|
2020-11-04 08:25:42 -08:00
|
|
|
func (er erasureObjects) NewNSLock(bucket string, objects ...string) RWLocker {
|
|
|
|
return er.nsMutex.NewNSLock(er.getLockers, bucket, objects...)
|
2020-06-12 20:04:01 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
// Shutdown function for object storage interface.
|
|
|
|
func (er erasureObjects) Shutdown(ctx context.Context) error {
|
|
|
|
// Add any object layer shutdown activities here.
|
2022-05-30 10:58:37 -07:00
|
|
|
closeStorageDisks(er.getDisks()...)
|
2020-06-12 20:04:01 -07:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2021-12-28 12:41:52 -08:00
|
|
|
// defaultWQuorum write quorum based on setDriveCount and defaultParityCount
|
|
|
|
func (er erasureObjects) defaultWQuorum() int {
|
|
|
|
dataCount := er.setDriveCount - er.defaultParityCount
|
|
|
|
if dataCount == er.defaultParityCount {
|
|
|
|
return dataCount + 1
|
|
|
|
}
|
|
|
|
return dataCount
|
|
|
|
}
|
|
|
|
|
2020-07-13 09:51:07 -07:00
|
|
|
func diskErrToDriveState(err error) (state string) {
|
2020-08-03 18:17:48 -07:00
|
|
|
switch {
|
2022-10-18 11:01:16 +01:00
|
|
|
case errors.Is(err, errDiskNotFound) || errors.Is(err, context.DeadlineExceeded):
|
2020-07-13 09:51:07 -07:00
|
|
|
state = madmin.DriveStateOffline
|
2020-08-03 18:17:48 -07:00
|
|
|
case errors.Is(err, errCorruptedFormat):
|
2020-07-13 09:51:07 -07:00
|
|
|
state = madmin.DriveStateCorrupt
|
2020-08-03 18:17:48 -07:00
|
|
|
case errors.Is(err, errUnformattedDisk):
|
2020-07-13 09:51:07 -07:00
|
|
|
state = madmin.DriveStateUnformatted
|
2020-08-03 18:17:48 -07:00
|
|
|
case errors.Is(err, errDiskAccessDenied):
|
2020-07-13 09:51:07 -07:00
|
|
|
state = madmin.DriveStatePermission
|
2020-08-03 18:17:48 -07:00
|
|
|
case errors.Is(err, errFaultyDisk):
|
2020-07-13 09:51:07 -07:00
|
|
|
state = madmin.DriveStateFaulty
|
2020-08-03 18:17:48 -07:00
|
|
|
case err == nil:
|
2020-07-13 09:51:07 -07:00
|
|
|
state = madmin.DriveStateOk
|
2022-10-14 00:41:44 +01:00
|
|
|
default:
|
|
|
|
state = fmt.Sprintf("%s (cause: %s)", madmin.DriveStateUnknown, err)
|
2020-07-13 09:51:07 -07:00
|
|
|
}
|
2022-10-14 00:41:44 +01:00
|
|
|
|
2020-07-13 09:51:07 -07:00
|
|
|
return
|
2020-06-12 20:04:01 -07:00
|
|
|
}
|
|
|
|
|
2020-12-21 18:35:19 +01:00
|
|
|
func getOnlineOfflineDisksStats(disksInfo []madmin.Disk) (onlineDisks, offlineDisks madmin.BackendDisks) {
|
2020-06-12 20:04:01 -07:00
|
|
|
onlineDisks = make(madmin.BackendDisks)
|
|
|
|
offlineDisks = make(madmin.BackendDisks)
|
|
|
|
|
2020-12-21 18:35:19 +01:00
|
|
|
for _, disk := range disksInfo {
|
|
|
|
ep := disk.Endpoint
|
2020-06-29 13:07:26 -07:00
|
|
|
if _, ok := offlineDisks[ep]; !ok {
|
|
|
|
offlineDisks[ep] = 0
|
2020-06-12 20:04:01 -07:00
|
|
|
}
|
2020-06-29 13:07:26 -07:00
|
|
|
if _, ok := onlineDisks[ep]; !ok {
|
|
|
|
onlineDisks[ep] = 0
|
2020-06-12 20:04:01 -07:00
|
|
|
}
|
2017-08-14 18:08:42 -07:00
|
|
|
}
|
2020-05-09 18:54:20 +02:00
|
|
|
|
2020-12-21 18:35:19 +01:00
|
|
|
// Wait for the routines.
|
|
|
|
for _, disk := range disksInfo {
|
|
|
|
ep := disk.Endpoint
|
|
|
|
state := disk.State
|
|
|
|
if state != madmin.DriveStateOk && state != madmin.DriveStateUnformatted {
|
|
|
|
offlineDisks[ep]++
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
onlineDisks[ep]++
|
|
|
|
}
|
|
|
|
|
|
|
|
rootDiskCount := 0
|
|
|
|
for _, di := range disksInfo {
|
|
|
|
if di.RootDisk {
|
|
|
|
rootDiskCount++
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Count offline disks as well to ensure consistent
|
|
|
|
// reportability of offline drives on local setups.
|
|
|
|
if len(disksInfo) == (rootDiskCount + offlineDisks.Sum()) {
|
|
|
|
// Success.
|
|
|
|
return onlineDisks, offlineDisks
|
|
|
|
}
|
|
|
|
|
|
|
|
// Root disk should be considered offline
|
|
|
|
for i := range disksInfo {
|
|
|
|
ep := disksInfo[i].Endpoint
|
|
|
|
if disksInfo[i].RootDisk {
|
|
|
|
offlineDisks[ep]++
|
|
|
|
onlineDisks[ep]--
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return onlineDisks, offlineDisks
|
|
|
|
}
|
|
|
|
|
|
|
|
// getDisksInfo - fetch disks info across all other storage API.
|
2022-12-01 14:31:35 -08:00
|
|
|
func getDisksInfo(disks []StorageAPI, endpoints []Endpoint) (disksInfo []madmin.Disk) {
|
2020-12-21 18:35:19 +01:00
|
|
|
disksInfo = make([]madmin.Disk, len(disks))
|
|
|
|
|
2020-06-12 20:04:01 -07:00
|
|
|
g := errgroup.WithNErrs(len(disks))
|
|
|
|
for index := range disks {
|
|
|
|
index := index
|
|
|
|
g.Go(func() error {
|
2023-07-20 15:48:21 +01:00
|
|
|
di := madmin.Disk{
|
|
|
|
Endpoint: endpoints[index].String(),
|
|
|
|
PoolIndex: endpoints[index].PoolIdx,
|
|
|
|
SetIndex: endpoints[index].SetIdx,
|
|
|
|
DiskIndex: endpoints[index].DiskIdx,
|
|
|
|
}
|
2020-06-12 20:04:01 -07:00
|
|
|
if disks[index] == OfflineDisk {
|
2023-07-20 15:48:21 +01:00
|
|
|
logger.LogOnceIf(GlobalContext, fmt.Errorf("%s: %s", errDiskNotFound, endpoints[index]), "get-disks-info-offline-"+di.Endpoint)
|
|
|
|
di.State = diskErrToDriveState(errDiskNotFound)
|
|
|
|
disksInfo[index] = di
|
2022-12-01 14:31:35 -08:00
|
|
|
return nil
|
2020-06-12 20:04:01 -07:00
|
|
|
}
|
2023-07-31 15:20:48 -07:00
|
|
|
info, err := disks[index].DiskInfo(context.TODO(), true)
|
2023-07-20 15:48:21 +01:00
|
|
|
di.DrivePath = info.MountPath
|
|
|
|
di.TotalSpace = info.Total
|
|
|
|
di.UsedSpace = info.Used
|
|
|
|
di.AvailableSpace = info.Free
|
|
|
|
di.UUID = info.ID
|
|
|
|
di.Major = info.Major
|
|
|
|
di.Minor = info.Minor
|
|
|
|
di.RootDisk = info.RootDisk
|
|
|
|
di.Healing = info.Healing
|
|
|
|
di.Scanning = info.Scanning
|
|
|
|
di.State = diskErrToDriveState(err)
|
|
|
|
di.FreeInodes = info.FreeInodes
|
|
|
|
di.UsedInodes = info.UsedInodes
|
2021-03-04 14:36:23 -08:00
|
|
|
if info.Healing {
|
|
|
|
if hi := disks[index].Healing(); hi != nil {
|
|
|
|
hd := hi.toHealingDisk()
|
|
|
|
di.HealInfo = &hd
|
|
|
|
}
|
|
|
|
}
|
2021-03-17 04:06:57 +01:00
|
|
|
di.Metrics = &madmin.DiskMetrics{
|
2023-08-01 12:47:50 -07:00
|
|
|
LastMinute: make(map[string]madmin.TimedAction, len(info.Metrics.LastMinute)),
|
|
|
|
APICalls: make(map[string]uint64, len(info.Metrics.APICalls)),
|
|
|
|
TotalErrorsAvailability: info.Metrics.TotalErrorsAvailability,
|
|
|
|
TotalErrorsTimeout: info.Metrics.TotalErrorsTimeout,
|
2021-03-17 04:06:57 +01:00
|
|
|
}
|
2022-07-05 14:45:49 -07:00
|
|
|
for k, v := range info.Metrics.LastMinute {
|
|
|
|
if v.N > 0 {
|
|
|
|
di.Metrics.LastMinute[k] = v.asTimedAction()
|
|
|
|
}
|
2021-03-17 04:06:57 +01:00
|
|
|
}
|
|
|
|
for k, v := range info.Metrics.APICalls {
|
|
|
|
di.Metrics.APICalls[k] = v
|
|
|
|
}
|
2020-07-13 09:51:07 -07:00
|
|
|
if info.Total > 0 {
|
|
|
|
di.Utilization = float64(info.Used / info.Total * 100)
|
|
|
|
}
|
|
|
|
disksInfo[index] = di
|
2022-12-01 14:31:35 -08:00
|
|
|
return nil
|
2020-06-12 20:04:01 -07:00
|
|
|
}, index)
|
2020-05-09 18:54:20 +02:00
|
|
|
}
|
|
|
|
|
2022-12-01 14:31:35 -08:00
|
|
|
g.Wait()
|
|
|
|
return disksInfo
|
2017-08-14 18:08:42 -07:00
|
|
|
}
|
|
|
|
|
2020-06-12 20:04:01 -07:00
|
|
|
// Get an aggregated storage info across all disks.
|
2022-12-01 14:31:35 -08:00
|
|
|
func getStorageInfo(disks []StorageAPI, endpoints []Endpoint) StorageInfo {
|
|
|
|
disksInfo := getDisksInfo(disks, endpoints)
|
2020-06-12 20:04:01 -07:00
|
|
|
|
|
|
|
// Sort so that the first element is the smallest.
|
2023-04-24 13:28:18 -07:00
|
|
|
sort.Slice(disksInfo, func(i, j int) bool {
|
|
|
|
return disksInfo[i].TotalSpace < disksInfo[j].TotalSpace
|
|
|
|
})
|
2020-06-12 20:04:01 -07:00
|
|
|
|
|
|
|
storageInfo := StorageInfo{
|
2020-07-13 09:51:07 -07:00
|
|
|
Disks: disksInfo,
|
2017-08-14 18:08:42 -07:00
|
|
|
}
|
2020-06-12 20:04:01 -07:00
|
|
|
|
2021-03-04 14:36:23 -08:00
|
|
|
storageInfo.Backend.Type = madmin.Erasure
|
2022-12-01 14:31:35 -08:00
|
|
|
return storageInfo
|
2017-08-14 18:08:42 -07:00
|
|
|
}
|
|
|
|
|
2020-06-12 20:04:01 -07:00
|
|
|
// StorageInfo - returns underlying storage statistics.
|
2022-12-01 14:31:35 -08:00
|
|
|
func (er erasureObjects) StorageInfo(ctx context.Context) StorageInfo {
|
2020-06-12 20:04:01 -07:00
|
|
|
disks := er.getDisks()
|
2020-06-29 13:07:26 -07:00
|
|
|
endpoints := er.getEndpoints()
|
|
|
|
return getStorageInfo(disks, endpoints)
|
2020-06-12 20:04:01 -07:00
|
|
|
}
|
|
|
|
|
2021-03-02 17:28:04 -08:00
|
|
|
// LocalStorageInfo - returns underlying local storage statistics.
|
2022-12-01 14:31:35 -08:00
|
|
|
func (er erasureObjects) LocalStorageInfo(ctx context.Context) StorageInfo {
|
2021-09-29 19:36:19 +01:00
|
|
|
disks := er.getDisks()
|
|
|
|
endpoints := er.getEndpoints()
|
|
|
|
|
|
|
|
var localDisks []StorageAPI
|
|
|
|
var localEndpoints []Endpoint
|
|
|
|
|
|
|
|
for i, endpoint := range endpoints {
|
|
|
|
if endpoint.IsLocal {
|
|
|
|
localDisks = append(localDisks, disks[i])
|
|
|
|
localEndpoints = append(localEndpoints, endpoint)
|
2021-03-02 17:28:04 -08:00
|
|
|
}
|
|
|
|
}
|
2021-09-29 19:36:19 +01:00
|
|
|
|
|
|
|
return getStorageInfo(localDisks, localEndpoints)
|
2021-03-02 17:28:04 -08:00
|
|
|
}
|
|
|
|
|
2021-01-19 02:40:52 -08:00
|
|
|
func (er erasureObjects) getOnlineDisksWithHealing() (newDisks []StorageAPI, healing bool) {
|
|
|
|
var wg sync.WaitGroup
|
|
|
|
disks := er.getDisks()
|
|
|
|
infos := make([]DiskInfo, len(disks))
|
2023-07-14 02:25:40 -07:00
|
|
|
r := rand.New(rand.NewSource(time.Now().UnixNano()))
|
|
|
|
for _, i := range r.Perm(len(disks)) {
|
2021-01-19 02:40:52 -08:00
|
|
|
i := i
|
|
|
|
wg.Add(1)
|
|
|
|
go func() {
|
|
|
|
defer wg.Done()
|
|
|
|
|
2023-07-14 02:25:40 -07:00
|
|
|
disk := disks[i]
|
2021-01-19 02:40:52 -08:00
|
|
|
if disk == nil {
|
2023-07-14 02:25:40 -07:00
|
|
|
infos[i].Error = "offline drive"
|
2021-01-19 02:40:52 -08:00
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2023-07-31 15:20:48 -07:00
|
|
|
di, err := disk.DiskInfo(context.Background(), false)
|
2023-07-14 02:25:40 -07:00
|
|
|
if err != nil || di.Healing {
|
2021-01-19 02:40:52 -08:00
|
|
|
// - Do not consume disks which are not reachable
|
|
|
|
// unformatted or simply not accessible for some reason.
|
|
|
|
//
|
|
|
|
//
|
|
|
|
// - Future: skip busy disks
|
2023-07-14 02:25:40 -07:00
|
|
|
if err != nil {
|
|
|
|
infos[i].Error = err.Error()
|
|
|
|
}
|
2021-01-19 02:40:52 -08:00
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2023-07-14 02:25:40 -07:00
|
|
|
infos[i] = di
|
2021-01-19 02:40:52 -08:00
|
|
|
}()
|
|
|
|
}
|
|
|
|
wg.Wait()
|
|
|
|
|
2023-08-09 12:51:47 -07:00
|
|
|
var scanningDisks []StorageAPI
|
2021-01-19 02:40:52 -08:00
|
|
|
for i, info := range infos {
|
|
|
|
// Check if one of the drives in the set is being healed.
|
2021-02-17 12:04:11 -08:00
|
|
|
// this information is used by scanner to skip healing
|
2021-01-19 02:40:52 -08:00
|
|
|
// this erasure set while it calculates the usage.
|
2021-02-02 17:04:37 -08:00
|
|
|
if info.Healing || info.Error != "" {
|
2021-01-19 02:40:52 -08:00
|
|
|
healing = true
|
|
|
|
continue
|
|
|
|
}
|
2023-08-09 12:51:47 -07:00
|
|
|
if !info.Scanning {
|
|
|
|
newDisks = append(newDisks, disks[i])
|
|
|
|
} else {
|
|
|
|
scanningDisks = append(scanningDisks, disks[i])
|
|
|
|
}
|
2021-01-19 02:40:52 -08:00
|
|
|
}
|
|
|
|
|
2023-08-09 12:51:47 -07:00
|
|
|
// Prefer new disks over disks which are currently being scanned.
|
|
|
|
newDisks = append(newDisks, scanningDisks...)
|
|
|
|
|
2021-01-19 02:40:52 -08:00
|
|
|
return newDisks, healing
|
|
|
|
}
|
|
|
|
|
2021-02-26 09:52:27 -08:00
|
|
|
// Clean-up previously deleted objects. from .minio.sys/tmp/.trash/
|
|
|
|
func (er erasureObjects) cleanupDeletedObjects(ctx context.Context) {
|
|
|
|
// run multiple cleanup's local to this server.
|
|
|
|
var wg sync.WaitGroup
|
|
|
|
for _, disk := range er.getLoadBalancedLocalDisks() {
|
|
|
|
if disk != nil {
|
|
|
|
wg.Add(1)
|
|
|
|
go func(disk StorageAPI) {
|
|
|
|
defer wg.Done()
|
|
|
|
diskPath := disk.Endpoint().Path
|
|
|
|
readDirFn(pathJoin(diskPath, minioMetaTmpDeletedBucket), func(ddir string, typ os.FileMode) error {
|
2023-08-14 12:28:13 -07:00
|
|
|
w := xioutil.NewDeadlineWorker(diskMaxTimeout)
|
|
|
|
return w.Run(func() error {
|
|
|
|
wait := deletedCleanupSleeper.Timer(ctx)
|
|
|
|
removeAll(pathJoin(diskPath, minioMetaTmpDeletedBucket, ddir))
|
|
|
|
wait()
|
|
|
|
return nil
|
|
|
|
})
|
2021-02-26 09:52:27 -08:00
|
|
|
})
|
|
|
|
}(disk)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
wg.Wait()
|
|
|
|
}
|
|
|
|
|
2021-02-26 15:11:42 -08:00
|
|
|
// nsScanner will start scanning buckets and send updated totals as they are traversed.
|
2020-06-12 20:04:01 -07:00
|
|
|
// Updates are sent on a regular basis and the caller *must* consume them.
|
2023-02-24 04:33:31 +01:00
|
|
|
func (er erasureObjects) nsScanner(ctx context.Context, buckets []BucketInfo, wantCycle uint32, updates chan<- dataUsageCache, healScanMode madmin.HealScanMode) error {
|
2020-08-25 10:55:15 -07:00
|
|
|
if len(buckets) == 0 {
|
|
|
|
return nil
|
|
|
|
}
|
2020-06-12 20:04:01 -07:00
|
|
|
|
2021-01-19 02:40:52 -08:00
|
|
|
// Collect disks we can use.
|
|
|
|
disks, healing := er.getOnlineDisksWithHealing()
|
2020-08-25 10:55:15 -07:00
|
|
|
if len(disks) == 0 {
|
2022-08-04 16:10:08 -07:00
|
|
|
logger.LogIf(ctx, errors.New("data-scanner: all drives are offline or being healed, skipping scanner cycle"))
|
2020-05-09 18:54:20 +02:00
|
|
|
return nil
|
|
|
|
}
|
2020-06-12 20:04:01 -07:00
|
|
|
|
|
|
|
// Load bucket totals
|
|
|
|
oldCache := dataUsageCache{}
|
2020-09-28 19:39:32 -07:00
|
|
|
if err := oldCache.load(ctx, er, dataUsageCacheName); err != nil {
|
2018-04-05 15:04:40 -07:00
|
|
|
return err
|
2017-08-14 18:08:42 -07:00
|
|
|
}
|
2019-01-17 04:58:18 -08:00
|
|
|
|
2020-06-12 20:04:01 -07:00
|
|
|
// New cache..
|
|
|
|
cache := dataUsageCache{
|
|
|
|
Info: dataUsageCacheInfo{
|
|
|
|
Name: dataUsageRoot,
|
|
|
|
NextCycle: oldCache.Info.NextCycle,
|
|
|
|
},
|
|
|
|
Cache: make(map[string]dataUsageEntry, len(oldCache.Cache)),
|
|
|
|
}
|
2019-01-17 04:58:18 -08:00
|
|
|
|
2020-06-12 20:04:01 -07:00
|
|
|
// Put all buckets into channel.
|
|
|
|
bucketCh := make(chan BucketInfo, len(buckets))
|
2023-07-14 02:25:40 -07:00
|
|
|
|
|
|
|
// Shuffle buckets to ensure total randomness of buckets, being scanned.
|
|
|
|
// Otherwise same set of buckets get scanned across erasure sets always.
|
|
|
|
// at any given point in time. This allows different buckets to be scanned
|
|
|
|
// in different order per erasure set, this wider spread is needed when
|
|
|
|
// there are lots of buckets with different order of objects in them.
|
|
|
|
r := rand.New(rand.NewSource(time.Now().UnixNano()))
|
|
|
|
permutes := r.Perm(len(buckets))
|
2020-06-12 20:04:01 -07:00
|
|
|
// Add new buckets first
|
2023-07-14 02:25:40 -07:00
|
|
|
for _, idx := range permutes {
|
|
|
|
b := buckets[idx]
|
|
|
|
if e := oldCache.find(b.Name); e == nil {
|
2020-06-12 20:04:01 -07:00
|
|
|
bucketCh <- b
|
|
|
|
}
|
2019-01-17 04:58:18 -08:00
|
|
|
}
|
2023-07-14 02:25:40 -07:00
|
|
|
for _, idx := range permutes {
|
|
|
|
b := buckets[idx]
|
|
|
|
if e := oldCache.find(b.Name); e != nil {
|
2020-06-12 20:04:01 -07:00
|
|
|
cache.replace(b.Name, dataUsageRoot, *e)
|
2020-08-24 13:47:01 -07:00
|
|
|
bucketCh <- b
|
2020-06-12 20:04:01 -07:00
|
|
|
}
|
2019-05-01 04:57:31 +05:30
|
|
|
}
|
2020-06-12 20:04:01 -07:00
|
|
|
close(bucketCh)
|
2023-07-14 02:25:40 -07:00
|
|
|
|
2020-06-12 20:04:01 -07:00
|
|
|
bucketResults := make(chan dataUsageEntryInfo, len(disks))
|
|
|
|
|
|
|
|
// Start async collector/saver.
|
|
|
|
// This goroutine owns the cache.
|
|
|
|
var saverWg sync.WaitGroup
|
|
|
|
saverWg.Add(1)
|
|
|
|
go func() {
|
2021-02-18 00:38:37 -08:00
|
|
|
// Add jitter to the update time so multiple sets don't sync up.
|
2022-01-02 09:15:06 -08:00
|
|
|
updateTime := 30*time.Second + time.Duration(float64(10*time.Second)*rand.Float64())
|
2020-06-12 20:04:01 -07:00
|
|
|
t := time.NewTicker(updateTime)
|
|
|
|
defer t.Stop()
|
|
|
|
defer saverWg.Done()
|
|
|
|
var lastSave time.Time
|
|
|
|
|
|
|
|
for {
|
|
|
|
select {
|
|
|
|
case <-t.C:
|
|
|
|
if cache.Info.LastUpdate.Equal(lastSave) {
|
|
|
|
continue
|
|
|
|
}
|
2023-06-24 20:29:13 -07:00
|
|
|
logger.LogOnceIf(ctx, cache.save(ctx, er, dataUsageCacheName), "nsscanner-cache-update")
|
2020-06-12 20:04:01 -07:00
|
|
|
updates <- cache.clone()
|
|
|
|
lastSave = cache.Info.LastUpdate
|
|
|
|
case v, ok := <-bucketResults:
|
|
|
|
if !ok {
|
2020-12-26 22:58:06 -08:00
|
|
|
// Save final state...
|
2021-08-25 17:25:26 +02:00
|
|
|
cache.Info.NextCycle = wantCycle
|
2020-12-26 22:58:06 -08:00
|
|
|
cache.Info.LastUpdate = time.Now()
|
2023-06-24 20:29:13 -07:00
|
|
|
logger.LogOnceIf(ctx, cache.save(ctx, er, dataUsageCacheName), "nsscanner-channel-closed")
|
2020-12-26 22:58:06 -08:00
|
|
|
updates <- cache
|
|
|
|
return
|
2020-06-12 20:04:01 -07:00
|
|
|
}
|
|
|
|
cache.replace(v.Name, v.Parent, v.Entry)
|
|
|
|
cache.Info.LastUpdate = time.Now()
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}()
|
|
|
|
|
2022-08-08 16:16:44 -07:00
|
|
|
// Restrict parallelism for disk usage scanner
|
|
|
|
// upto GOMAXPROCS if GOMAXPROCS is < len(disks)
|
|
|
|
maxProcs := runtime.GOMAXPROCS(0)
|
|
|
|
if maxProcs < len(disks) {
|
|
|
|
disks = disks[:maxProcs]
|
|
|
|
}
|
|
|
|
|
2021-02-17 12:04:11 -08:00
|
|
|
// Start one scanner per disk
|
2020-06-12 20:04:01 -07:00
|
|
|
var wg sync.WaitGroup
|
|
|
|
wg.Add(len(disks))
|
2023-03-09 15:15:46 -08:00
|
|
|
|
2020-06-12 20:04:01 -07:00
|
|
|
for i := range disks {
|
|
|
|
go func(i int) {
|
|
|
|
defer wg.Done()
|
|
|
|
disk := disks[i]
|
|
|
|
|
|
|
|
for bucket := range bucketCh {
|
|
|
|
select {
|
|
|
|
case <-ctx.Done():
|
|
|
|
return
|
|
|
|
default:
|
|
|
|
}
|
|
|
|
|
|
|
|
// Load cache for bucket
|
|
|
|
cacheName := pathJoin(bucket.Name, dataUsageCacheName)
|
|
|
|
cache := dataUsageCache{}
|
|
|
|
logger.LogIf(ctx, cache.load(ctx, er, cacheName))
|
|
|
|
if cache.Info.Name == "" {
|
|
|
|
cache.Info.Name = bucket.Name
|
|
|
|
}
|
2021-01-19 02:40:52 -08:00
|
|
|
cache.Info.SkipHealing = healing
|
2021-08-25 17:25:26 +02:00
|
|
|
cache.Info.NextCycle = wantCycle
|
2020-06-12 20:04:01 -07:00
|
|
|
if cache.Info.Name != bucket.Name {
|
|
|
|
logger.LogIf(ctx, fmt.Errorf("cache name mismatch: %s != %s", cache.Info.Name, bucket.Name))
|
|
|
|
cache.Info = dataUsageCacheInfo{
|
|
|
|
Name: bucket.Name,
|
|
|
|
LastUpdate: time.Time{},
|
2021-08-25 17:25:26 +02:00
|
|
|
NextCycle: wantCycle,
|
2020-06-12 20:04:01 -07:00
|
|
|
}
|
|
|
|
}
|
2021-05-19 23:38:30 +02:00
|
|
|
// Collect updates.
|
|
|
|
updates := make(chan dataUsageEntry, 1)
|
|
|
|
var wg sync.WaitGroup
|
|
|
|
wg.Add(1)
|
2021-07-02 11:19:56 -07:00
|
|
|
go func(name string) {
|
2021-05-19 23:38:30 +02:00
|
|
|
defer wg.Done()
|
|
|
|
for update := range updates {
|
2023-03-01 06:34:45 +01:00
|
|
|
select {
|
|
|
|
case <-ctx.Done():
|
|
|
|
case bucketResults <- dataUsageEntryInfo{
|
2021-07-02 11:19:56 -07:00
|
|
|
Name: name,
|
2021-05-19 23:38:30 +02:00
|
|
|
Parent: dataUsageRoot,
|
|
|
|
Entry: update,
|
2023-03-01 06:34:45 +01:00
|
|
|
}:
|
2021-05-19 23:38:30 +02:00
|
|
|
}
|
|
|
|
}
|
2021-07-02 11:19:56 -07:00
|
|
|
}(cache.Info.Name)
|
2020-06-12 20:04:01 -07:00
|
|
|
// Calc usage
|
|
|
|
before := cache.Info.LastUpdate
|
2020-09-28 19:39:32 -07:00
|
|
|
var err error
|
2022-04-07 16:10:40 +01:00
|
|
|
cache, err = disk.NSScanner(ctx, cache, updates, healScanMode)
|
2020-06-12 20:04:01 -07:00
|
|
|
if err != nil {
|
2021-02-22 10:04:32 -08:00
|
|
|
if !cache.Info.LastUpdate.IsZero() && cache.Info.LastUpdate.After(before) {
|
2020-06-12 20:04:01 -07:00
|
|
|
logger.LogIf(ctx, cache.save(ctx, er, cacheName))
|
2021-02-22 10:04:32 -08:00
|
|
|
} else {
|
|
|
|
logger.LogIf(ctx, err)
|
2020-06-12 20:04:01 -07:00
|
|
|
}
|
2022-01-19 00:46:43 -08:00
|
|
|
// This ensures that we don't close
|
|
|
|
// bucketResults channel while the
|
|
|
|
// updates-collector goroutine still
|
|
|
|
// holds a reference to this.
|
|
|
|
wg.Wait()
|
2020-06-12 20:04:01 -07:00
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
2021-05-19 23:38:30 +02:00
|
|
|
wg.Wait()
|
2020-06-12 20:04:01 -07:00
|
|
|
var root dataUsageEntry
|
|
|
|
if r := cache.root(); r != nil {
|
|
|
|
root = cache.flatten(*r)
|
|
|
|
}
|
2023-03-01 06:34:45 +01:00
|
|
|
select {
|
|
|
|
case <-ctx.Done():
|
|
|
|
return
|
|
|
|
case bucketResults <- dataUsageEntryInfo{
|
2020-06-12 20:04:01 -07:00
|
|
|
Name: cache.Info.Name,
|
|
|
|
Parent: dataUsageRoot,
|
|
|
|
Entry: root,
|
2023-03-01 06:34:45 +01:00
|
|
|
}:
|
2020-06-12 20:04:01 -07:00
|
|
|
}
|
2023-03-09 15:15:46 -08:00
|
|
|
|
2020-06-12 20:04:01 -07:00
|
|
|
// Save cache
|
|
|
|
logger.LogIf(ctx, cache.save(ctx, er, cacheName))
|
|
|
|
}
|
|
|
|
}(i)
|
2019-01-17 04:58:18 -08:00
|
|
|
}
|
2020-06-12 20:04:01 -07:00
|
|
|
wg.Wait()
|
|
|
|
close(bucketResults)
|
|
|
|
saverWg.Wait()
|
|
|
|
|
|
|
|
return nil
|
|
|
|
}
|