2016-05-06 01:21:56 +05:30
|
|
|
/*
|
|
|
|
* Minio Cloud Storage, (C) 2016 Minio, Inc.
|
|
|
|
*
|
|
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
* you may not use this file except in compliance with the License.
|
|
|
|
* You may obtain a copy of the License at
|
|
|
|
*
|
|
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
*
|
|
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
* See the License for the specific language governing permissions and
|
|
|
|
* limitations under the License.
|
|
|
|
*/
|
|
|
|
|
|
|
|
package main
|
|
|
|
|
|
|
|
import (
|
2016-05-20 20:48:47 -07:00
|
|
|
"math/rand"
|
2016-05-06 01:21:56 +05:30
|
|
|
"path"
|
|
|
|
"sort"
|
|
|
|
"strings"
|
|
|
|
"time"
|
|
|
|
)
|
|
|
|
|
|
|
|
// listParams bundles the arguments of a single list-objects request. It is
// a comparable value and serves as the key of the map in which in-progress
// tree walkers are stored (see saveTreeWalkXL and lookupTreeWalkXL).
type listParams struct {
	bucket         string // Bucket being listed.
	recursive      bool   // Whether the listing descends into sub-directories.
	marker, prefix string // Marker to resume after, and prefix entries must match.
}
|
|
|
|
|
|
|
|
// treeWalkResult is a single message produced by a tree walk and delivered
// over the walker's channel.
type treeWalkResult struct {
	// objInfo describes the listed entry; left at its zero value when the
	// result only reports an error.
	objInfo ObjectInfo
	// err is set by treeWalkXL when listing a directory failed.
	err error
	// end is set by the sender in startTreeWalkXL when no listed entries
	// remain to be processed, i.e. this is the final result of the walk.
	end bool
}
|
|
|
|
|
|
|
|
// treeWalker is the handle to a tree walk running in its own goroutine. It
// exposes the channel on which results arrive and records whether the walk
// gave up because nobody consumed a result in time.
type treeWalker struct {
	// ch is the receive side of the result channel; the walking goroutine
	// closes it when the walk finishes.
	ch <-chan treeWalkResult
	// timedOut is set to true by the walking goroutine when a result could
	// not be delivered within the send timeout. lookupTreeWalkXL skips
	// walkers that have this flag set.
	timedOut bool
}
|
|
|
|
|
2016-05-20 20:48:47 -07:00
|
|
|
// listDir - listDir.
|
|
|
|
func (xl xlObjects) listDir(bucket, prefixDir string, filter func(entry string) bool) (entries []string, err error) {
|
|
|
|
// Count for list errors encountered.
|
|
|
|
var listErrCount = 0
|
|
|
|
|
2016-05-24 17:48:58 -07:00
|
|
|
// Return the first success entry based on the selected random disk.
|
2016-05-20 20:48:47 -07:00
|
|
|
for listErrCount < len(xl.storageDisks) {
|
|
|
|
// Choose a random disk on each attempt, do not hit the same disk all the time.
|
|
|
|
randIndex := rand.Intn(len(xl.storageDisks) - 1)
|
|
|
|
disk := xl.storageDisks[randIndex] // Pick a random disk.
|
|
|
|
if entries, err = disk.ListDir(bucket, prefixDir); err == nil {
|
|
|
|
// Skip the entries which do not match the filter.
|
|
|
|
for i, entry := range entries {
|
|
|
|
if filter(entry) {
|
|
|
|
entries[i] = ""
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
if strings.HasSuffix(entry, slashSeparator) && xl.isObject(bucket, path.Join(prefixDir, entry)) {
|
|
|
|
entries[i] = strings.TrimSuffix(entry, slashSeparator)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
sort.Strings(entries)
|
|
|
|
// Skip the empty strings
|
|
|
|
for len(entries) > 0 && entries[0] == "" {
|
|
|
|
entries = entries[1:]
|
|
|
|
}
|
|
|
|
return entries, nil
|
|
|
|
}
|
|
|
|
listErrCount++ // Update list error count.
|
|
|
|
}
|
|
|
|
|
|
|
|
// Return error at the end.
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
|
|
|
|
// getRandomDisk - gives a random disk at any point in time from the
|
2016-05-24 17:48:58 -07:00
|
|
|
// available pool of disks.
|
2016-05-20 20:48:47 -07:00
|
|
|
func (xl xlObjects) getRandomDisk() (disk StorageAPI) {
|
|
|
|
randIndex := rand.Intn(len(xl.storageDisks) - 1)
|
|
|
|
disk = xl.storageDisks[randIndex] // Pick a random disk.
|
|
|
|
return disk
|
|
|
|
}
|
|
|
|
|
|
|
|
// treeWalkXL walks directory tree recursively pushing fileInfo into the channel as and when it encounters files.
|
|
|
|
func (xl xlObjects) treeWalkXL(bucket, prefixDir, entryPrefixMatch, marker string, recursive bool, send func(treeWalkResult) bool, count *int) bool {
|
2016-05-06 01:21:56 +05:30
|
|
|
// Example:
|
|
|
|
// if prefixDir="one/two/three/" and marker="four/five.txt" treeWalk is recursively
|
|
|
|
// called with prefixDir="one/two/three/four/" and marker="five.txt"
|
|
|
|
|
|
|
|
// Convert entry to FileInfo
|
2016-05-20 20:48:47 -07:00
|
|
|
entryToObjectInfo := func(entry string) (objInfo ObjectInfo, err error) {
|
2016-05-06 01:21:56 +05:30
|
|
|
if strings.HasSuffix(entry, slashSeparator) {
|
|
|
|
// Object name needs to be full path.
|
2016-05-20 20:48:47 -07:00
|
|
|
objInfo.Bucket = bucket
|
|
|
|
objInfo.Name = path.Join(prefixDir, entry)
|
|
|
|
objInfo.Name += slashSeparator
|
|
|
|
objInfo.IsDir = true
|
|
|
|
return objInfo, nil
|
2016-05-06 01:21:56 +05:30
|
|
|
}
|
2016-05-20 20:48:47 -07:00
|
|
|
// Set the Mode to a "regular" file.
|
|
|
|
return xl.getObjectInfo(bucket, path.Join(prefixDir, entry))
|
2016-05-06 01:21:56 +05:30
|
|
|
}
|
|
|
|
|
|
|
|
var markerBase, markerDir string
|
|
|
|
if marker != "" {
|
|
|
|
// Ex: if marker="four/five.txt", markerDir="four/" markerBase="five.txt"
|
|
|
|
markerSplit := strings.SplitN(marker, slashSeparator, 2)
|
|
|
|
markerDir = markerSplit[0]
|
|
|
|
if len(markerSplit) == 2 {
|
|
|
|
markerDir += slashSeparator
|
|
|
|
markerBase = markerSplit[1]
|
|
|
|
}
|
|
|
|
}
|
2016-05-20 20:48:47 -07:00
|
|
|
entries, err := xl.listDir(bucket, prefixDir, func(entry string) bool {
|
|
|
|
return !strings.HasPrefix(entry, entryPrefixMatch)
|
|
|
|
})
|
2016-05-06 01:21:56 +05:30
|
|
|
if err != nil {
|
|
|
|
send(treeWalkResult{err: err})
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
if len(entries) == 0 {
|
|
|
|
return true
|
|
|
|
}
|
2016-05-20 20:48:47 -07:00
|
|
|
|
2016-05-06 01:21:56 +05:30
|
|
|
// example:
|
|
|
|
// If markerDir="four/" Search() returns the index of "four/" in the sorted
|
|
|
|
// entries list so we skip all the entries till "four/"
|
2016-05-07 02:08:03 -07:00
|
|
|
idx := sort.Search(len(entries), func(i int) bool {
|
2016-05-20 20:48:47 -07:00
|
|
|
return entries[i] >= markerDir
|
2016-05-07 02:08:03 -07:00
|
|
|
})
|
2016-05-06 01:21:56 +05:30
|
|
|
entries = entries[idx:]
|
|
|
|
*count += len(entries)
|
|
|
|
for i, entry := range entries {
|
|
|
|
if i == 0 && markerDir == entry {
|
|
|
|
if !recursive {
|
|
|
|
// Skip as the marker would already be listed in the previous listing.
|
|
|
|
*count--
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
if recursive && !strings.HasSuffix(entry, slashSeparator) {
|
|
|
|
// We should not skip for recursive listing and if markerDir is a directory
|
|
|
|
// for ex. if marker is "four/five.txt" markerDir will be "four/" which
|
2016-05-20 20:48:47 -07:00
|
|
|
// should not be skipped, instead it will need to be treeWalkXL()'ed into.
|
2016-05-06 01:21:56 +05:30
|
|
|
|
|
|
|
// Skip if it is a file though as it would be listed in previous listing.
|
|
|
|
*count--
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if recursive && strings.HasSuffix(entry, slashSeparator) {
|
|
|
|
// If the entry is a directory, we will need recurse into it.
|
|
|
|
markerArg := ""
|
|
|
|
if entry == markerDir {
|
|
|
|
// We need to pass "five.txt" as marker only if we are
|
|
|
|
// recursing into "four/"
|
|
|
|
markerArg = markerBase
|
|
|
|
}
|
|
|
|
*count--
|
|
|
|
prefixMatch := "" // Valid only for first level treeWalk and empty for subdirectories.
|
2016-05-20 20:48:47 -07:00
|
|
|
if !xl.treeWalkXL(bucket, path.Join(prefixDir, entry), prefixMatch, markerArg, recursive, send, count) {
|
2016-05-06 01:21:56 +05:30
|
|
|
return false
|
|
|
|
}
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
*count--
|
2016-05-20 20:48:47 -07:00
|
|
|
objInfo, err := entryToObjectInfo(entry)
|
2016-05-06 01:21:56 +05:30
|
|
|
if err != nil {
|
|
|
|
// The file got deleted in the interim between ListDir() and StatFile()
|
|
|
|
// Ignore error and continue.
|
|
|
|
continue
|
|
|
|
}
|
2016-05-20 20:48:47 -07:00
|
|
|
if !send(treeWalkResult{objInfo: objInfo}) {
|
2016-05-06 01:21:56 +05:30
|
|
|
return false
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return true
|
|
|
|
}
|
|
|
|
|
|
|
|
// Initiate a new treeWalk in a goroutine.
|
2016-05-20 20:48:47 -07:00
|
|
|
func (xl xlObjects) startTreeWalkXL(bucket, prefix, marker string, recursive bool) *treeWalker {
|
2016-05-06 01:21:56 +05:30
|
|
|
// Example 1
|
|
|
|
// If prefix is "one/two/three/" and marker is "one/two/three/four/five.txt"
|
|
|
|
// treeWalk is called with prefixDir="one/two/three/" and marker="four/five.txt"
|
|
|
|
// and entryPrefixMatch=""
|
|
|
|
|
|
|
|
// Example 2
|
|
|
|
// if prefix is "one/two/th" and marker is "one/two/three/four/five.txt"
|
|
|
|
// treeWalk is called with prefixDir="one/two/" and marker="three/four/five.txt"
|
|
|
|
// and entryPrefixMatch="th"
|
|
|
|
|
|
|
|
ch := make(chan treeWalkResult, maxObjectList)
|
|
|
|
walkNotify := treeWalker{ch: ch}
|
|
|
|
entryPrefixMatch := prefix
|
|
|
|
prefixDir := ""
|
|
|
|
lastIndex := strings.LastIndex(prefix, slashSeparator)
|
|
|
|
if lastIndex != -1 {
|
|
|
|
entryPrefixMatch = prefix[lastIndex+1:]
|
|
|
|
prefixDir = prefix[:lastIndex+1]
|
|
|
|
}
|
|
|
|
count := 0
|
|
|
|
marker = strings.TrimPrefix(marker, prefixDir)
|
|
|
|
go func() {
|
|
|
|
defer close(ch)
|
|
|
|
send := func(walkResult treeWalkResult) bool {
|
|
|
|
if count == 0 {
|
|
|
|
walkResult.end = true
|
|
|
|
}
|
|
|
|
timer := time.After(time.Second * 60)
|
|
|
|
select {
|
|
|
|
case ch <- walkResult:
|
|
|
|
return true
|
|
|
|
case <-timer:
|
|
|
|
walkNotify.timedOut = true
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
}
|
2016-05-20 20:48:47 -07:00
|
|
|
xl.treeWalkXL(bucket, prefixDir, entryPrefixMatch, marker, recursive, send, &count)
|
2016-05-06 01:21:56 +05:30
|
|
|
}()
|
|
|
|
return &walkNotify
|
|
|
|
}
|
|
|
|
|
|
|
|
// Save the goroutine reference in the map
|
2016-05-20 20:48:47 -07:00
|
|
|
func (xl xlObjects) saveTreeWalkXL(params listParams, walker *treeWalker) {
|
|
|
|
xl.listObjectMapMutex.Lock()
|
|
|
|
defer xl.listObjectMapMutex.Unlock()
|
2016-05-06 01:21:56 +05:30
|
|
|
|
2016-05-20 20:48:47 -07:00
|
|
|
walkers, _ := xl.listObjectMap[params]
|
2016-05-06 01:21:56 +05:30
|
|
|
walkers = append(walkers, walker)
|
|
|
|
|
2016-05-20 20:48:47 -07:00
|
|
|
xl.listObjectMap[params] = walkers
|
2016-05-06 01:21:56 +05:30
|
|
|
}
|
|
|
|
|
|
|
|
// Lookup the goroutine reference from map
|
2016-05-20 20:48:47 -07:00
|
|
|
func (xl xlObjects) lookupTreeWalkXL(params listParams) *treeWalker {
|
|
|
|
xl.listObjectMapMutex.Lock()
|
|
|
|
defer xl.listObjectMapMutex.Unlock()
|
2016-05-06 01:21:56 +05:30
|
|
|
|
2016-05-20 20:48:47 -07:00
|
|
|
if walkChs, ok := xl.listObjectMap[params]; ok {
|
2016-05-06 01:21:56 +05:30
|
|
|
for i, walkCh := range walkChs {
|
|
|
|
if !walkCh.timedOut {
|
|
|
|
newWalkChs := walkChs[i+1:]
|
|
|
|
if len(newWalkChs) > 0 {
|
2016-05-20 20:48:47 -07:00
|
|
|
xl.listObjectMap[params] = newWalkChs
|
2016-05-06 01:21:56 +05:30
|
|
|
} else {
|
2016-05-20 20:48:47 -07:00
|
|
|
delete(xl.listObjectMap, params)
|
2016-05-06 01:21:56 +05:30
|
|
|
}
|
|
|
|
return walkCh
|
|
|
|
}
|
|
|
|
}
|
|
|
|
// As all channels are timed out, delete the map entry
|
2016-05-20 20:48:47 -07:00
|
|
|
delete(xl.listObjectMap, params)
|
2016-05-06 01:21:56 +05:30
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|