2016-05-06 01:21:56 +05:30
|
|
|
/*
|
|
|
|
* Minio Cloud Storage, (C) 2016 Minio, Inc.
|
|
|
|
*
|
|
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
* you may not use this file except in compliance with the License.
|
|
|
|
* You may obtain a copy of the License at
|
|
|
|
*
|
|
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
*
|
|
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
* See the License for the specific language governing permissions and
|
|
|
|
* limitations under the License.
|
|
|
|
*/
|
|
|
|
|
|
|
|
package main
|
|
|
|
|
|
|
|
import (
|
|
|
|
"sort"
|
|
|
|
"strings"
|
|
|
|
)
|
|
|
|
|
2016-07-07 22:10:27 -07:00
|
|
|
// list of all errors that can be ignored in tree walk operation.
|
|
|
|
var walkResultIgnoredErrs = []error{
|
|
|
|
errFileNotFound,
|
|
|
|
errVolumeNotFound,
|
|
|
|
errDiskNotFound,
|
|
|
|
errDiskAccessDenied,
|
|
|
|
errFaultyDisk,
|
|
|
|
}
|
|
|
|
|
2016-05-06 01:21:56 +05:30
|
|
|
// treeWalkResult is a single item delivered on the tree walk result channel.
type treeWalkResult struct {
	// entry is the walked path: the directory prefix joined with the entry name.
	entry string
	// err is set when listing a directory failed; no entry accompanies it.
	err error
	// end marks the last entry of the whole walk.
	end bool
}
|
|
|
|
|
2016-07-18 03:46:52 +05:30
|
|
|
// delayIsLeafCheck reports whether the isLeaf() check on the given sorted
// entries can be postponed until each entry is pushed into the treeWalkResult
// channel (true), or whether it has to be done right away in listDir() (false).
//
// Background: posix.ListDir returns directories with a trailing "/". At the
// object layer that trailing "/" has to be removed for objects and kept for
// prefixes, and removing it can change the sort order. For example, with
// entries = ["a-b/", "a/"] where both are objects:
//
//	sorted without the trailing "/" = ["a", "a-b"]
//	sorted with the trailing "/"    = ["a-b/", "a/"]
//
// Such a reordering is only possible when an entry has a byte smaller than '/'
// at a position where the following entry has '/'. If no adjacent pair looks
// like that, the check can safely be delayed.
func delayIsLeafCheck(entries []string) bool {
	for idx := 1; idx < len(entries); idx++ {
		prev, next := entries[idx-1], entries[idx]

		// Only positions present in both names can collide.
		limit := len(prev)
		if len(next) < limit {
			limit = len(next)
		}
		for pos := 0; pos < limit; pos++ {
			if prev[pos] < '/' && next[pos] == '/' {
				return false
			}
		}
	}
	return true
}
|
|
|
|
|
|
|
|
// filterMatchingPrefix returns the sub-slice of entries that starts at the
// first entry having the prefix prefixEntry and stops after the last entry
// having it. The result shares the backing array of entries.
//
// Note: entries are expected to be sorted, so that all matching entries are
// contiguous; anything lying between the first and the last match is returned
// without being checked.
func filterMatchingPrefix(entries []string, prefixEntry string) []string {
	lo, hi := 0, len(entries)

	// Drop non-matching entries from the front.
	for lo < hi && !strings.HasPrefix(entries[lo], prefixEntry) {
		lo++
	}
	// Drop non-matching entries from the back.
	for hi > lo && !strings.HasPrefix(entries[hi-1], prefixEntry) {
		hi--
	}
	return entries[lo:hi]
}
|
|
|
|
|
2016-07-04 14:19:27 +05:30
|
|
|
// "listDir" function of type listDirFunc returned by listDirFactory() - explained below.
|
2016-07-18 03:46:52 +05:30
|
|
|
// listDirFunc lists the entries found under prefixDir in bucket, restricted to
// those whose names start with prefixEntry. As implemented by listDirFactory,
// delayIsLeaf reports whether the isLeaf check (and the trimming of the
// trailing "/" on leaf entries) was left for the caller to perform.
type listDirFunc func(bucket, prefixDir, prefixEntry string) (entries []string, delayIsLeaf bool, err error)
|
|
|
|
|
|
|
|
// A function isLeaf of type isLeafFunc is used to detect if an entry is a leaf entry. There are four scenarios
|
|
|
|
// where isLeaf should behave differently:
|
|
|
|
// 1. FS backend object listing - isLeaf is true if the entry has no trailing "/"
|
|
|
|
// 2. FS backend multipart listing - isLeaf is true if the entry is a directory and contains uploads.json
|
|
|
|
// 3. XL backend object listing - isLeaf is true if the entry is a directory and contains xl.json
|
|
|
|
// 4. XL backend multipart listing - isLeaf is true if the entry is a directory and contains uploads.json
|
|
|
|
// isLeafFunc reports whether an entry is a leaf. The tree walk calls it with
// the bucket name as the first argument and the entry's path (prefix directory
// joined with the entry name) as the second.
type isLeafFunc func(string, string) bool
|
2016-07-04 14:19:27 +05:30
|
|
|
|
|
|
|
// Returns function "listDir" of the type listDirFunc.
|
|
|
|
// isLeaf - is used by listDir function to check if an entry is a leaf or non-leaf entry.
|
|
|
|
// disks - used for doing disk.ListDir(). FS passes single disk argument, XL passes a list of disks.
|
2016-07-18 03:46:52 +05:30
|
|
|
func listDirFactory(isLeaf isLeafFunc, disks ...StorageAPI) listDirFunc {
|
2016-07-04 14:19:27 +05:30
|
|
|
// listDir - lists all the entries at a given prefix and given entry in the prefix.
|
2016-07-18 03:46:52 +05:30
|
|
|
listDir := func(bucket, prefixDir, prefixEntry string) (entries []string, delayIsLeaf bool, err error) {
|
2016-07-04 14:19:27 +05:30
|
|
|
for _, disk := range disks {
|
|
|
|
if disk == nil {
|
2016-06-02 22:49:27 -07:00
|
|
|
continue
|
|
|
|
}
|
2016-07-04 14:19:27 +05:30
|
|
|
entries, err = disk.ListDir(bucket, prefixDir)
|
2016-07-07 22:10:27 -07:00
|
|
|
if err == nil {
|
2016-07-18 03:46:52 +05:30
|
|
|
// Listing needs to be sorted.
|
|
|
|
sort.Strings(entries)
|
|
|
|
|
|
|
|
// Filter entries that have the prefix prefixEntry.
|
|
|
|
entries = filterMatchingPrefix(entries, prefixEntry)
|
|
|
|
|
|
|
|
// Can isLeaf() check be delayed till when it has to be sent down the
|
|
|
|
// treeWalkResult channel?
|
|
|
|
delayIsLeaf = delayIsLeafCheck(entries)
|
|
|
|
if delayIsLeaf {
|
|
|
|
return entries, delayIsLeaf, nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// isLeaf() check has to happen here so that trailing "/" for objects can be removed.
|
2016-07-07 22:10:27 -07:00
|
|
|
for i, entry := range entries {
|
|
|
|
if isLeaf(bucket, pathJoin(prefixDir, entry)) {
|
|
|
|
entries[i] = strings.TrimSuffix(entry, slashSeparator)
|
|
|
|
}
|
2016-07-04 14:19:27 +05:30
|
|
|
}
|
2016-07-18 03:46:52 +05:30
|
|
|
// Sort again after removing trailing "/" for objects as the previous sort
|
|
|
|
// does not hold good anymore.
|
2016-07-07 22:10:27 -07:00
|
|
|
sort.Strings(entries)
|
2016-07-18 03:46:52 +05:30
|
|
|
return entries, delayIsLeaf, nil
|
2016-05-20 20:48:47 -07:00
|
|
|
}
|
2016-07-07 22:10:27 -07:00
|
|
|
// For any reason disk was deleted or goes offline, continue
|
|
|
|
// and list from other disks if possible.
|
|
|
|
if isErrIgnored(err, walkResultIgnoredErrs) {
|
|
|
|
continue
|
2016-07-04 14:19:27 +05:30
|
|
|
}
|
2016-07-07 22:10:27 -07:00
|
|
|
break
|
2016-05-20 20:48:47 -07:00
|
|
|
}
|
2016-07-04 14:19:27 +05:30
|
|
|
// Return error at the end.
|
2016-07-18 03:46:52 +05:30
|
|
|
return nil, false, err
|
2016-07-04 14:19:27 +05:30
|
|
|
}
|
|
|
|
return listDir
|
2016-05-20 20:48:47 -07:00
|
|
|
}
|
|
|
|
|
2016-07-04 14:19:27 +05:30
|
|
|
// treeWalk walks directory tree recursively pushing treeWalkResult into the channel as and when it encounters files.
|
2016-07-18 03:46:52 +05:30
|
|
|
func doTreeWalk(bucket, prefixDir, entryPrefixMatch, marker string, recursive bool, listDir listDirFunc, isLeaf isLeafFunc, resultCh chan treeWalkResult, endWalkCh chan struct{}, isEnd bool) error {
|
2016-05-06 01:21:56 +05:30
|
|
|
// Example:
|
|
|
|
// if prefixDir="one/two/three/" and marker="four/five.txt" treeWalk is recursively
|
|
|
|
// called with prefixDir="one/two/three/four/" and marker="five.txt"
|
|
|
|
|
|
|
|
var markerBase, markerDir string
|
|
|
|
if marker != "" {
|
|
|
|
// Ex: if marker="four/five.txt", markerDir="four/" markerBase="five.txt"
|
|
|
|
markerSplit := strings.SplitN(marker, slashSeparator, 2)
|
|
|
|
markerDir = markerSplit[0]
|
|
|
|
if len(markerSplit) == 2 {
|
|
|
|
markerDir += slashSeparator
|
|
|
|
markerBase = markerSplit[1]
|
|
|
|
}
|
|
|
|
}
|
2016-07-18 03:46:52 +05:30
|
|
|
entries, delayIsLeaf, err := listDir(bucket, prefixDir, entryPrefixMatch)
|
2016-05-06 01:21:56 +05:30
|
|
|
if err != nil {
|
2016-05-29 21:05:00 -07:00
|
|
|
select {
|
2016-06-06 00:25:45 +05:30
|
|
|
case <-endWalkCh:
|
2016-06-04 00:03:50 +05:30
|
|
|
return errWalkAbort
|
2016-06-06 00:25:45 +05:30
|
|
|
case resultCh <- treeWalkResult{err: err}:
|
2016-06-04 00:03:50 +05:30
|
|
|
return err
|
2016-05-29 21:05:00 -07:00
|
|
|
}
|
2016-05-06 01:21:56 +05:30
|
|
|
}
|
2016-06-04 00:03:50 +05:30
|
|
|
// For an empty list return right here.
|
2016-05-06 01:21:56 +05:30
|
|
|
if len(entries) == 0 {
|
2016-06-04 00:03:50 +05:30
|
|
|
return nil
|
2016-05-06 01:21:56 +05:30
|
|
|
}
|
2016-05-20 20:48:47 -07:00
|
|
|
|
2016-05-06 01:21:56 +05:30
|
|
|
// example:
|
|
|
|
// If markerDir="four/" Search() returns the index of "four/" in the sorted
|
|
|
|
// entries list so we skip all the entries till "four/"
|
2016-05-07 02:08:03 -07:00
|
|
|
idx := sort.Search(len(entries), func(i int) bool {
|
2016-05-20 20:48:47 -07:00
|
|
|
return entries[i] >= markerDir
|
2016-05-07 02:08:03 -07:00
|
|
|
})
|
2016-05-06 01:21:56 +05:30
|
|
|
entries = entries[idx:]
|
2016-06-04 00:03:50 +05:30
|
|
|
// For an empty list after search through the entries, return right here.
|
2016-05-29 21:05:00 -07:00
|
|
|
if len(entries) == 0 {
|
2016-06-04 00:03:50 +05:30
|
|
|
return nil
|
2016-05-29 21:05:00 -07:00
|
|
|
}
|
2016-05-06 01:21:56 +05:30
|
|
|
for i, entry := range entries {
|
2016-07-18 03:46:52 +05:30
|
|
|
// Decision to do isLeaf check was pushed from listDir() to here.
|
|
|
|
if delayIsLeaf && isLeaf(bucket, pathJoin(prefixDir, entry)) {
|
|
|
|
entry = strings.TrimSuffix(entry, slashSeparator)
|
|
|
|
}
|
|
|
|
|
2016-05-06 01:21:56 +05:30
|
|
|
if i == 0 && markerDir == entry {
|
|
|
|
if !recursive {
|
|
|
|
// Skip as the marker would already be listed in the previous listing.
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
if recursive && !strings.HasSuffix(entry, slashSeparator) {
|
|
|
|
// We should not skip for recursive listing and if markerDir is a directory
|
|
|
|
// for ex. if marker is "four/five.txt" markerDir will be "four/" which
|
2016-05-30 16:51:59 -07:00
|
|
|
// should not be skipped, instead it will need to be treeWalk()'ed into.
|
2016-05-06 01:21:56 +05:30
|
|
|
|
|
|
|
// Skip if it is a file though as it would be listed in previous listing.
|
|
|
|
continue
|
|
|
|
}
|
|
|
|
}
|
|
|
|
if recursive && strings.HasSuffix(entry, slashSeparator) {
|
|
|
|
// If the entry is a directory, we will need recurse into it.
|
|
|
|
markerArg := ""
|
|
|
|
if entry == markerDir {
|
|
|
|
// We need to pass "five.txt" as marker only if we are
|
|
|
|
// recursing into "four/"
|
|
|
|
markerArg = markerBase
|
|
|
|
}
|
|
|
|
prefixMatch := "" // Valid only for first level treeWalk and empty for subdirectories.
|
2016-06-04 00:03:50 +05:30
|
|
|
// markIsEnd is passed to this entry's treeWalk() so that treeWalker.end can be marked
|
|
|
|
// true at the end of the treeWalk stream.
|
|
|
|
markIsEnd := i == len(entries)-1 && isEnd
|
2016-07-18 03:46:52 +05:30
|
|
|
if tErr := doTreeWalk(bucket, pathJoin(prefixDir, entry), prefixMatch, markerArg, recursive, listDir, isLeaf, resultCh, endWalkCh, markIsEnd); tErr != nil {
|
2016-06-04 00:03:50 +05:30
|
|
|
return tErr
|
2016-05-06 01:21:56 +05:30
|
|
|
}
|
|
|
|
continue
|
|
|
|
}
|
2016-06-04 00:03:50 +05:30
|
|
|
// EOF is set if we are at last entry and the caller indicated we at the end.
|
|
|
|
isEOF := ((i == len(entries)-1) && isEnd)
|
2016-05-29 21:05:00 -07:00
|
|
|
select {
|
2016-06-06 00:25:45 +05:30
|
|
|
case <-endWalkCh:
|
2016-06-04 00:03:50 +05:30
|
|
|
return errWalkAbort
|
2016-06-06 00:25:45 +05:30
|
|
|
case resultCh <- treeWalkResult{entry: pathJoin(prefixDir, entry), end: isEOF}:
|
2016-05-29 21:05:00 -07:00
|
|
|
}
|
|
|
|
}
|
2016-06-04 00:03:50 +05:30
|
|
|
|
|
|
|
// Everything is listed.
|
|
|
|
return nil
|
2016-05-06 01:21:56 +05:30
|
|
|
}
|
|
|
|
|
|
|
|
// Initiate a new treeWalk in a goroutine.
|
2016-07-18 03:46:52 +05:30
|
|
|
func startTreeWalk(bucket, prefix, marker string, recursive bool, listDir listDirFunc, isLeaf isLeafFunc, endWalkCh chan struct{}) chan treeWalkResult {
|
2016-05-06 01:21:56 +05:30
|
|
|
// Example 1
|
|
|
|
// If prefix is "one/two/three/" and marker is "one/two/three/four/five.txt"
|
|
|
|
// treeWalk is called with prefixDir="one/two/three/" and marker="four/five.txt"
|
|
|
|
// and entryPrefixMatch=""
|
|
|
|
|
|
|
|
// Example 2
|
|
|
|
// if prefix is "one/two/th" and marker is "one/two/three/four/five.txt"
|
|
|
|
// treeWalk is called with prefixDir="one/two/" and marker="three/four/five.txt"
|
|
|
|
// and entryPrefixMatch="th"
|
|
|
|
|
2016-06-06 00:25:45 +05:30
|
|
|
resultCh := make(chan treeWalkResult, maxObjectList)
|
2016-05-06 01:21:56 +05:30
|
|
|
entryPrefixMatch := prefix
|
|
|
|
prefixDir := ""
|
|
|
|
lastIndex := strings.LastIndex(prefix, slashSeparator)
|
|
|
|
if lastIndex != -1 {
|
|
|
|
entryPrefixMatch = prefix[lastIndex+1:]
|
|
|
|
prefixDir = prefix[:lastIndex+1]
|
|
|
|
}
|
|
|
|
marker = strings.TrimPrefix(marker, prefixDir)
|
2016-06-04 00:03:50 +05:30
|
|
|
go func() {
|
|
|
|
isEnd := true // Indication to start walking the tree with end as true.
|
2016-07-18 03:46:52 +05:30
|
|
|
doTreeWalk(bucket, prefixDir, entryPrefixMatch, marker, recursive, listDir, isLeaf, resultCh, endWalkCh, isEnd)
|
2016-06-06 00:25:45 +05:30
|
|
|
close(resultCh)
|
2016-06-04 00:03:50 +05:30
|
|
|
}()
|
2016-06-06 00:25:45 +05:30
|
|
|
return resultCh
|
2016-05-06 01:21:56 +05:30
|
|
|
}
|