2016-05-20 20:48:47 -07:00
|
|
|
/*
|
2019-04-09 11:39:42 -07:00
|
|
|
* MinIO Cloud Storage, (C) 2016, 2017, 2018 MinIO, Inc.
|
2016-05-20 20:48:47 -07:00
|
|
|
*
|
|
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
* you may not use this file except in compliance with the License.
|
|
|
|
* You may obtain a copy of the License at
|
|
|
|
*
|
|
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
*
|
|
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
* See the License for the specific language governing permissions and
|
|
|
|
* limitations under the License.
|
|
|
|
*/
|
|
|
|
|
2016-08-18 16:23:42 -07:00
|
|
|
package cmd
|
2016-05-20 20:48:47 -07:00
|
|
|
|
|
|
|
import (
|
2018-03-14 12:01:47 -07:00
|
|
|
"context"
|
2020-03-19 00:19:29 +01:00
|
|
|
"fmt"
|
2016-05-26 14:13:10 -07:00
|
|
|
"sort"
|
2019-12-12 15:02:37 +01:00
|
|
|
"sync"
|
2020-03-19 00:19:29 +01:00
|
|
|
"time"
|
2016-05-26 14:13:10 -07:00
|
|
|
|
2018-04-05 15:04:40 -07:00
|
|
|
"github.com/minio/minio/cmd/logger"
|
2018-02-15 17:45:57 -08:00
|
|
|
"github.com/minio/minio/pkg/bpool"
|
2019-11-13 12:17:45 -08:00
|
|
|
"github.com/minio/minio/pkg/dsync"
|
2019-10-23 09:31:14 +05:30
|
|
|
"github.com/minio/minio/pkg/madmin"
|
2019-10-14 09:44:51 -07:00
|
|
|
"github.com/minio/minio/pkg/sync/errgroup"
|
2016-05-20 20:48:47 -07:00
|
|
|
)
|
|
|
|
|
2016-05-30 16:51:59 -07:00
|
|
|
// xlMetaJSONFile is the name of the XL metadata file, which carries the
// per-object metadata.
const xlMetaJSONFile = "xl.json"
|
|
|
|
|
2018-08-23 23:35:37 -07:00
|
|
|
// OfflineDisk represents an unavailable disk.
|
|
|
|
var OfflineDisk StorageAPI // zero value is nil
|
|
|
|
|
2020-01-16 03:30:32 +01:00
|
|
|
// partialUpload describes an object upload that succeeded (write quorum was
// reached) but was not written to all disks.
type partialUpload struct {
	// bucket and object identify the uploaded object.
	bucket, object string
	// NOTE(review): presumably the index of the set that missed the write;
	// confirm against the code that produces these values.
	failedSet int
}
|
|
|
|
|
2016-05-30 16:51:59 -07:00
|
|
|
// xlObjects - Implements XL object layer.
|
2016-05-20 20:48:47 -07:00
|
|
|
type xlObjects struct {
|
2018-02-15 17:45:57 -08:00
|
|
|
// getDisks returns list of storageAPIs.
|
|
|
|
getDisks func() []StorageAPI
|
2016-05-20 20:48:47 -07:00
|
|
|
|
2019-11-13 12:17:45 -08:00
|
|
|
// getLockers returns list of remote and local lockers.
|
|
|
|
getLockers func() []dsync.NetLocker
|
|
|
|
|
2020-03-04 16:18:32 -08:00
|
|
|
endpoints Endpoints
|
|
|
|
|
2019-11-13 12:17:45 -08:00
|
|
|
// Locker mutex map.
|
|
|
|
nsMutex *nsLockMap
|
|
|
|
|
2018-02-15 17:45:57 -08:00
|
|
|
// Byte pools used for temporary i/o buffers.
|
|
|
|
bp *bpool.BytePoolCap
|
2018-02-12 01:46:12 -08:00
|
|
|
|
2018-02-15 17:45:57 -08:00
|
|
|
// TODO: ListObjects pool management, should be removed in future.
|
2019-04-17 09:52:08 -07:00
|
|
|
listPool *TreeWalkPool
|
2020-01-16 03:30:32 +01:00
|
|
|
|
|
|
|
mrfUploadCh chan partialUpload
|
2017-01-16 17:05:00 -08:00
|
|
|
}
|
|
|
|
|
2019-11-13 12:17:45 -08:00
|
|
|
// NewNSLock - initialize a new namespace RWLocker instance.
|
2020-02-21 11:29:57 +05:30
|
|
|
func (xl xlObjects) NewNSLock(ctx context.Context, bucket string, objects ...string) RWLocker {
|
|
|
|
return xl.nsMutex.NewNSLock(ctx, xl.getLockers, bucket, objects...)
|
2019-11-13 12:17:45 -08:00
|
|
|
}
|
|
|
|
|
2016-08-15 07:55:48 +01:00
|
|
|
// Shutdown function for object storage interface.
|
2018-03-14 12:01:47 -07:00
|
|
|
func (xl xlObjects) Shutdown(ctx context.Context) error {
|
2016-08-15 07:55:48 +01:00
|
|
|
// Add any object layer shutdown activities here.
|
2018-04-03 23:58:48 -05:00
|
|
|
closeStorageDisks(xl.getDisks())
|
2016-08-15 07:55:48 +01:00
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2016-05-26 14:13:10 -07:00
|
|
|
// byDiskTotal is a collection satisfying sort.Interface.
|
2018-05-23 03:11:29 -07:00
|
|
|
type byDiskTotal []DiskInfo
|
2016-05-26 14:13:10 -07:00
|
|
|
|
|
|
|
func (d byDiskTotal) Len() int { return len(d) }
|
|
|
|
func (d byDiskTotal) Swap(i, j int) { d[i], d[j] = d[j], d[i] }
|
|
|
|
func (d byDiskTotal) Less(i, j int) bool {
|
|
|
|
return d[i].Total < d[j].Total
|
|
|
|
}
|
|
|
|
|
2016-10-05 12:48:07 -07:00
|
|
|
// getDisksInfo - fetch disks info across all other storage API.
|
2020-03-04 16:18:32 -08:00
|
|
|
func getDisksInfo(disks []StorageAPI, endpoints Endpoints) (disksInfo []DiskInfo, onlineDisks, offlineDisks madmin.BackendDisks) {
|
2018-05-23 03:11:29 -07:00
|
|
|
disksInfo = make([]DiskInfo, len(disks))
|
2019-10-14 09:44:51 -07:00
|
|
|
|
|
|
|
g := errgroup.WithNErrs(len(disks))
|
|
|
|
for index := range disks {
|
|
|
|
index := index
|
|
|
|
g.Go(func() error {
|
|
|
|
if disks[index] == nil {
|
|
|
|
// Storage disk is empty, perhaps ignored disk or not available.
|
|
|
|
return errDiskNotFound
|
|
|
|
}
|
|
|
|
info, err := disks[index].DiskInfo()
|
2019-08-23 08:32:40 +05:30
|
|
|
if err != nil {
|
|
|
|
if IsErr(err, baseErrs...) {
|
2019-10-14 09:44:51 -07:00
|
|
|
return err
|
2019-08-23 08:32:40 +05:30
|
|
|
}
|
2019-10-14 09:44:51 -07:00
|
|
|
reqInfo := (&logger.ReqInfo{}).AppendTags("disk", disks[index].String())
|
2020-04-09 09:30:02 -07:00
|
|
|
ctx := logger.SetReqInfo(GlobalContext, reqInfo)
|
2019-10-14 09:44:51 -07:00
|
|
|
logger.LogIf(ctx, err)
|
2016-10-05 12:48:07 -07:00
|
|
|
}
|
2019-10-14 09:44:51 -07:00
|
|
|
disksInfo[index] = info
|
|
|
|
return nil
|
|
|
|
}, index)
|
2016-05-26 14:13:10 -07:00
|
|
|
}
|
2019-08-23 17:03:15 -07:00
|
|
|
|
2019-10-23 09:31:14 +05:30
|
|
|
onlineDisks = make(madmin.BackendDisks)
|
|
|
|
offlineDisks = make(madmin.BackendDisks)
|
2020-02-20 04:51:33 +01:00
|
|
|
|
2019-10-23 09:31:14 +05:30
|
|
|
// Wait for the routines.
|
2020-02-20 04:51:33 +01:00
|
|
|
for i, diskInfoErr := range g.Wait() {
|
2020-03-04 16:18:32 -08:00
|
|
|
peerAddr := endpoints[i].Host
|
2019-10-23 09:31:14 +05:30
|
|
|
if _, ok := offlineDisks[peerAddr]; !ok {
|
|
|
|
offlineDisks[peerAddr] = 0
|
|
|
|
}
|
|
|
|
if _, ok := onlineDisks[peerAddr]; !ok {
|
|
|
|
onlineDisks[peerAddr] = 0
|
|
|
|
}
|
2020-03-04 16:18:32 -08:00
|
|
|
if disks[i] == nil || diskInfoErr != nil {
|
2019-10-23 09:31:14 +05:30
|
|
|
offlineDisks[peerAddr]++
|
2019-10-31 21:43:54 +05:30
|
|
|
continue
|
2019-10-23 09:31:14 +05:30
|
|
|
}
|
|
|
|
onlineDisks[peerAddr]++
|
2019-08-23 17:03:15 -07:00
|
|
|
}
|
|
|
|
|
2016-10-05 12:48:07 -07:00
|
|
|
// Success.
|
|
|
|
return disksInfo, onlineDisks, offlineDisks
|
|
|
|
}
|
|
|
|
|
|
|
|
// Get an aggregated storage info across all disks.
|
2020-03-04 16:18:32 -08:00
|
|
|
func getStorageInfo(disks []StorageAPI, endpoints Endpoints) StorageInfo {
|
|
|
|
disksInfo, onlineDisks, offlineDisks := getDisksInfo(disks, endpoints)
|
2016-10-17 14:31:33 -07:00
|
|
|
|
|
|
|
// Sort so that the first element is the smallest.
|
2020-01-10 02:35:06 -08:00
|
|
|
sort.Sort(byDiskTotal(disksInfo))
|
2016-10-17 14:31:33 -07:00
|
|
|
|
2019-04-04 21:21:50 -07:00
|
|
|
// Combine all disks to get total usage
|
2020-01-10 02:35:06 -08:00
|
|
|
usedList := make([]uint64, len(disksInfo))
|
|
|
|
totalList := make([]uint64, len(disksInfo))
|
|
|
|
availableList := make([]uint64, len(disksInfo))
|
|
|
|
mountPaths := make([]string, len(disksInfo))
|
2019-10-23 09:31:14 +05:30
|
|
|
|
2020-01-10 02:35:06 -08:00
|
|
|
for i, di := range disksInfo {
|
2019-10-23 09:31:14 +05:30
|
|
|
usedList[i] = di.Used
|
|
|
|
totalList[i] = di.Total
|
|
|
|
availableList[i] = di.Free
|
2020-02-20 04:51:33 +01:00
|
|
|
mountPaths[i] = di.MountPath
|
2018-05-23 03:11:29 -07:00
|
|
|
}
|
|
|
|
|
2019-02-13 04:59:36 -08:00
|
|
|
storageInfo := StorageInfo{
|
2019-10-23 09:31:14 +05:30
|
|
|
Used: usedList,
|
|
|
|
Total: totalList,
|
|
|
|
Available: availableList,
|
|
|
|
MountPaths: mountPaths,
|
2019-02-13 04:59:36 -08:00
|
|
|
}
|
2019-04-04 21:21:50 -07:00
|
|
|
|
2018-08-23 23:35:37 -07:00
|
|
|
storageInfo.Backend.Type = BackendErasure
|
2016-10-05 12:48:07 -07:00
|
|
|
storageInfo.Backend.OnlineDisks = onlineDisks
|
|
|
|
storageInfo.Backend.OfflineDisks = offlineDisks
|
2017-12-22 16:58:13 +05:30
|
|
|
|
2016-10-05 12:48:07 -07:00
|
|
|
return storageInfo
|
|
|
|
}
|
|
|
|
|
|
|
|
// StorageInfo - returns underlying storage statistics.
|
2020-02-20 04:51:33 +01:00
|
|
|
func (xl xlObjects) StorageInfo(ctx context.Context, local bool) StorageInfo {
|
2020-03-04 16:18:32 -08:00
|
|
|
var endpoints = xl.endpoints
|
2020-02-20 04:51:33 +01:00
|
|
|
var disks []StorageAPI
|
2020-03-04 16:18:32 -08:00
|
|
|
|
2020-02-20 04:51:33 +01:00
|
|
|
if !local {
|
|
|
|
disks = xl.getDisks()
|
|
|
|
} else {
|
2020-03-04 16:18:32 -08:00
|
|
|
for i, d := range xl.getDisks() {
|
2020-03-27 14:48:30 -07:00
|
|
|
if endpoints[i].IsLocal && d.Hostname() == "" {
|
2020-02-20 04:51:33 +01:00
|
|
|
// Append this local disk since local flag is true
|
|
|
|
disks = append(disks, d)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2020-03-04 16:18:32 -08:00
|
|
|
return getStorageInfo(disks, endpoints)
|
2016-05-26 14:13:10 -07:00
|
|
|
}
|
2019-12-06 12:46:06 +05:30
|
|
|
|
2020-01-21 14:07:49 -08:00
|
|
|
// GetMetrics - is not implemented and shouldn't be called.
|
2019-12-06 12:46:06 +05:30
|
|
|
func (xl xlObjects) GetMetrics(ctx context.Context) (*Metrics, error) {
|
|
|
|
logger.LogIf(ctx, NotImplemented{})
|
|
|
|
return &Metrics{}, NotImplemented{}
|
|
|
|
}
|
2019-12-12 15:02:37 +01:00
|
|
|
|
2020-03-19 00:19:29 +01:00
|
|
|
// CrawlAndGetDataUsage will start crawling buckets and send updated totals as they are traversed.
|
|
|
|
// Updates are sent on a regular basis and the caller *must* consume them.
|
|
|
|
func (xl xlObjects) CrawlAndGetDataUsage(ctx context.Context, updates chan<- DataUsageInfo) error {
|
|
|
|
cache := make(chan dataUsageCache, 1)
|
|
|
|
defer close(cache)
|
|
|
|
buckets, err := xl.ListBuckets(ctx)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
go func() {
|
|
|
|
for update := range cache {
|
|
|
|
updates <- update.dui(update.Info.Name, buckets)
|
|
|
|
}
|
|
|
|
}()
|
|
|
|
return xl.crawlAndGetDataUsage(ctx, buckets, cache)
|
|
|
|
}
|
|
|
|
|
|
|
|
// CrawlAndGetDataUsage will start crawling buckets and send updated totals as they are traversed.
|
|
|
|
// Updates are sent on a regular basis and the caller *must* consume them.
|
|
|
|
func (xl xlObjects) crawlAndGetDataUsage(ctx context.Context, buckets []BucketInfo, updates chan<- dataUsageCache) error {
|
|
|
|
var disks []StorageAPI
|
|
|
|
|
2019-12-12 15:02:37 +01:00
|
|
|
for _, d := range xl.getLoadBalancedDisks() {
|
|
|
|
if d == nil || !d.IsOnline() {
|
|
|
|
continue
|
|
|
|
}
|
2020-03-19 00:19:29 +01:00
|
|
|
disks = append(disks, d)
|
|
|
|
}
|
|
|
|
if len(disks) == 0 || len(buckets) == 0 {
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// Load bucket totals
|
|
|
|
oldCache := dataUsageCache{}
|
|
|
|
err := oldCache.load(ctx, xl, dataUsageCacheName)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
2019-12-12 15:02:37 +01:00
|
|
|
}
|
|
|
|
|
2020-03-19 00:19:29 +01:00
|
|
|
// New cache..
|
|
|
|
cache := dataUsageCache{
|
|
|
|
Info: dataUsageCacheInfo{
|
|
|
|
Name: dataUsageRoot,
|
|
|
|
NextCycle: oldCache.Info.NextCycle,
|
|
|
|
},
|
|
|
|
Cache: make(map[dataUsageHash]dataUsageEntry, len(oldCache.Cache)),
|
|
|
|
}
|
2019-12-12 15:02:37 +01:00
|
|
|
|
2020-03-19 00:19:29 +01:00
|
|
|
// Put all buckets into channel.
|
|
|
|
bucketCh := make(chan BucketInfo, len(buckets))
|
|
|
|
// Add new buckets first
|
|
|
|
for _, b := range buckets {
|
|
|
|
if oldCache.find(b.Name) == nil {
|
|
|
|
bucketCh <- b
|
|
|
|
}
|
|
|
|
}
|
|
|
|
// Add existing buckets.
|
|
|
|
for _, b := range buckets {
|
|
|
|
e := oldCache.find(b.Name)
|
|
|
|
if e != nil {
|
|
|
|
bucketCh <- b
|
|
|
|
cache.replace(b.Name, dataUsageRoot, *e)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
close(bucketCh)
|
|
|
|
buckets = nil
|
|
|
|
bucketResults := make(chan dataUsageEntryInfo, len(disks))
|
|
|
|
|
|
|
|
// Start async collector/saver.
|
|
|
|
// This goroutine owns the cache.
|
|
|
|
var saverWg sync.WaitGroup
|
|
|
|
saverWg.Add(1)
|
|
|
|
go func() {
|
|
|
|
const updateTime = 30 * time.Second
|
|
|
|
t := time.NewTicker(updateTime)
|
|
|
|
defer t.Stop()
|
|
|
|
defer saverWg.Done()
|
|
|
|
var lastSave time.Time
|
|
|
|
|
|
|
|
saveLoop:
|
|
|
|
for {
|
|
|
|
select {
|
|
|
|
case <-ctx.Done():
|
|
|
|
// Return without saving.
|
|
|
|
return
|
|
|
|
case <-t.C:
|
|
|
|
if cache.Info.LastUpdate.Equal(lastSave) {
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
logger.LogIf(ctx, cache.save(ctx, xl, dataUsageCacheName))
|
|
|
|
updates <- cache.clone()
|
|
|
|
lastSave = cache.Info.LastUpdate
|
|
|
|
case v, ok := <-bucketResults:
|
|
|
|
if !ok {
|
|
|
|
break saveLoop
|
|
|
|
}
|
|
|
|
cache.replace(v.Name, v.Parent, v.Entry)
|
|
|
|
cache.Info.LastUpdate = time.Now()
|
|
|
|
}
|
|
|
|
}
|
|
|
|
// Save final state...
|
|
|
|
cache.Info.NextCycle++
|
|
|
|
cache.Info.LastUpdate = time.Now()
|
|
|
|
logger.LogIf(ctx, cache.save(ctx, xl, dataUsageCacheName))
|
|
|
|
updates <- cache
|
|
|
|
}()
|
|
|
|
|
|
|
|
// Start one crawler per disk
|
2019-12-12 15:02:37 +01:00
|
|
|
var wg sync.WaitGroup
|
2020-03-19 00:19:29 +01:00
|
|
|
wg.Add(len(disks))
|
|
|
|
for i := range disks {
|
|
|
|
go func(i int) {
|
2019-12-12 15:02:37 +01:00
|
|
|
defer wg.Done()
|
2020-03-19 00:19:29 +01:00
|
|
|
disk := disks[i]
|
|
|
|
|
|
|
|
for bucket := range bucketCh {
|
|
|
|
select {
|
|
|
|
case <-ctx.Done():
|
|
|
|
return
|
|
|
|
default:
|
|
|
|
}
|
2020-03-19 09:47:47 -07:00
|
|
|
|
2020-03-19 00:19:29 +01:00
|
|
|
// Load cache for bucket
|
2020-03-19 09:47:47 -07:00
|
|
|
cacheName := pathJoin(bucket.Name, dataUsageCacheName)
|
2020-03-19 00:19:29 +01:00
|
|
|
cache := dataUsageCache{}
|
|
|
|
logger.LogIf(ctx, cache.load(ctx, xl, cacheName))
|
|
|
|
if cache.Info.Name == "" {
|
|
|
|
cache.Info.Name = bucket.Name
|
|
|
|
}
|
|
|
|
if cache.Info.Name != bucket.Name {
|
|
|
|
logger.LogIf(ctx, fmt.Errorf("cache name mismatch: %s != %s", cache.Info.Name, bucket.Name))
|
|
|
|
cache.Info = dataUsageCacheInfo{
|
|
|
|
Name: bucket.Name,
|
|
|
|
LastUpdate: time.Time{},
|
|
|
|
NextCycle: 0,
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Calc usage
|
|
|
|
before := cache.Info.LastUpdate
|
|
|
|
cache, err = disk.CrawlAndGetDataUsage(ctx, cache)
|
|
|
|
if err != nil {
|
|
|
|
logger.LogIf(ctx, err)
|
|
|
|
if cache.Info.LastUpdate.After(before) {
|
|
|
|
logger.LogIf(ctx, cache.save(ctx, xl, cacheName))
|
|
|
|
}
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
|
|
|
|
var root dataUsageEntry
|
|
|
|
if r := cache.root(); r != nil {
|
|
|
|
root = cache.flatten(*r)
|
|
|
|
}
|
|
|
|
bucketResults <- dataUsageEntryInfo{
|
|
|
|
Name: cache.Info.Name,
|
|
|
|
Parent: dataUsageRoot,
|
|
|
|
Entry: root,
|
|
|
|
}
|
|
|
|
// Save cache
|
|
|
|
logger.LogIf(ctx, cache.save(ctx, xl, cacheName))
|
2019-12-12 15:02:37 +01:00
|
|
|
}
|
2020-03-19 00:19:29 +01:00
|
|
|
}(i)
|
2019-12-12 15:02:37 +01:00
|
|
|
}
|
|
|
|
wg.Wait()
|
2020-03-19 00:19:29 +01:00
|
|
|
close(bucketResults)
|
|
|
|
saverWg.Wait()
|
2019-12-12 15:02:37 +01:00
|
|
|
|
2020-03-19 00:19:29 +01:00
|
|
|
return nil
|
2019-12-12 15:02:37 +01:00
|
|
|
}
|
2019-12-28 22:24:43 +05:30
|
|
|
|
|
|
|
// IsReady - No Op.
|
|
|
|
func (xl xlObjects) IsReady(ctx context.Context) bool {
|
|
|
|
logger.CriticalIf(ctx, NotImplemented{})
|
|
|
|
return true
|
|
|
|
}
|