2016-04-04 19:55:07 -07:00
|
|
|
/*
|
|
|
|
* Minio Cloud Storage, (C) 2016 Minio, Inc.
|
|
|
|
*
|
|
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
* you may not use this file except in compliance with the License.
|
|
|
|
* You may obtain a copy of the License at
|
|
|
|
*
|
|
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
*
|
|
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
* See the License for the specific language governing permissions and
|
|
|
|
* limitations under the License.
|
|
|
|
*/
|
|
|
|
|
2016-04-05 05:57:55 +05:30
|
|
|
package main
|
|
|
|
|
|
|
|
import (
|
|
|
|
"os"
|
|
|
|
"path/filepath"
|
|
|
|
"sort"
|
|
|
|
"strings"
|
|
|
|
"time"
|
|
|
|
)
|
|
|
|
|
2016-04-04 19:55:07 -07:00
|
|
|
// fsDirent describes one directory entry: its name plus whatever metadata
// was available for it.
type fsDirent struct {
	// name is the name of the entry.
	name string
	// modTime is the modification time. It is left empty on Solaris and
	// older unix distros.
	modTime time.Time
	// size is the size of the entry. It is left empty on Solaris and older
	// unix distros.
	size int64
	// mode holds the file mode bits that the type predicates below inspect.
	mode os.FileMode
}

// IsDir reports whether the entry is a directory.
func (d fsDirent) IsDir() bool {
	return d.mode&os.ModeDir != 0
}

// IsSymlink reports whether the entry is a symbolic link.
func (d fsDirent) IsSymlink() bool {
	return d.mode&os.ModeSymlink != 0
}

// IsRegular reports whether the entry is a regular file, i.e. none of the
// file type bits are set in its mode.
func (d fsDirent) IsRegular() bool {
	return d.mode&os.ModeType == 0
}
|
|
|
|
|
2016-04-09 00:16:03 +05:30
|
|
|
// byDirentName is a collection satisfying sort.Interface.
|
|
|
|
type byDirentName []fsDirent
|
|
|
|
|
|
|
|
func (d byDirentName) Len() int { return len(d) }
|
|
|
|
func (d byDirentName) Swap(i, j int) { d[i], d[j] = d[j], d[i] }
|
|
|
|
func (d byDirentName) Less(i, j int) bool { return d[i].name < d[j].name }
|
|
|
|
|
2016-04-08 23:07:38 +05:30
|
|
|
// Using sort.Search() internally to jump to the file entry containing
|
|
|
|
// the prefix.
|
2016-04-05 05:57:55 +05:30
|
|
|
func searchDirents(dirents []fsDirent, x string) int {
|
|
|
|
processFunc := func(i int) bool {
|
|
|
|
return dirents[i].name >= x
|
|
|
|
}
|
|
|
|
return sort.Search(len(dirents), processFunc)
|
|
|
|
}
|
|
|
|
|
2016-04-04 19:55:07 -07:00
|
|
|
// Tree walk result carries results of tree walking.
|
2016-04-05 05:57:55 +05:30
|
|
|
type treeWalkResult struct {
|
2016-04-08 23:07:38 +05:30
|
|
|
fileInfo FileInfo
|
|
|
|
err error
|
|
|
|
end bool
|
2016-04-05 05:57:55 +05:30
|
|
|
}
|
|
|
|
|
2016-04-04 19:55:07 -07:00
|
|
|
// Tree walk notify carries a channel which notifies tree walk
|
|
|
|
// results, additionally it also carries information if treeWalk
|
|
|
|
// should be timedOut.
|
2016-04-05 05:57:55 +05:30
|
|
|
type treeWalker struct {
|
|
|
|
ch <-chan treeWalkResult
|
|
|
|
timedOut bool
|
|
|
|
}
|
|
|
|
|
2016-04-08 23:07:38 +05:30
|
|
|
// treeWalk walks FS directory tree recursively pushing fileInfo into the channel as and when it encounters files.
|
2016-04-05 05:57:55 +05:30
|
|
|
func treeWalk(bucketDir, prefixDir, entryPrefixMatch, marker string, recursive bool, send func(treeWalkResult) bool, count *int) bool {
|
|
|
|
// Example:
|
|
|
|
// if prefixDir="one/two/three/" and marker="four/five.txt" treeWalk is recursively
|
|
|
|
// called with prefixDir="one/two/three/four/" and marker="five.txt"
|
|
|
|
|
2016-04-08 23:07:38 +05:30
|
|
|
// Convert dirent to FileInfo
|
|
|
|
direntToFileInfo := func(dirent fsDirent) (FileInfo, error) {
|
|
|
|
fileInfo := FileInfo{}
|
2016-04-04 19:55:07 -07:00
|
|
|
// Convert to full object name.
|
2016-04-08 23:07:38 +05:30
|
|
|
fileInfo.Name = filepath.Join(prefixDir, dirent.name)
|
2016-04-09 00:16:03 +05:30
|
|
|
if dirent.modTime.IsZero() && dirent.size == 0 {
|
2016-04-05 05:57:55 +05:30
|
|
|
// ModifiedTime and Size are zero, Stat() and figure out
|
|
|
|
// the actual values that need to be set.
|
|
|
|
fi, err := os.Stat(filepath.Join(bucketDir, prefixDir, dirent.name))
|
|
|
|
if err != nil {
|
2016-04-08 23:07:38 +05:30
|
|
|
return FileInfo{}, err
|
2016-04-05 05:57:55 +05:30
|
|
|
}
|
2016-04-04 19:55:07 -07:00
|
|
|
// Fill size and modtime.
|
2016-04-08 23:07:38 +05:30
|
|
|
fileInfo.ModTime = fi.ModTime()
|
|
|
|
fileInfo.Size = fi.Size()
|
|
|
|
fileInfo.Mode = fi.Mode()
|
2016-04-05 05:57:55 +05:30
|
|
|
} else {
|
2016-04-08 23:07:38 +05:30
|
|
|
// If ModTime or Size are set then use them
|
2016-04-05 05:57:55 +05:30
|
|
|
// without attempting another Stat operation.
|
2016-04-08 23:07:38 +05:30
|
|
|
fileInfo.ModTime = dirent.modTime
|
|
|
|
fileInfo.Size = dirent.size
|
|
|
|
fileInfo.Mode = dirent.mode
|
2016-04-05 05:57:55 +05:30
|
|
|
}
|
2016-04-08 23:07:38 +05:30
|
|
|
if fileInfo.Mode.IsDir() {
|
2016-04-04 19:55:07 -07:00
|
|
|
// Add os.PathSeparator suffix again for directories as
|
|
|
|
// filepath.Join would have removed it.
|
2016-04-08 23:07:38 +05:30
|
|
|
fileInfo.Size = 0
|
|
|
|
fileInfo.Name += string(os.PathSeparator)
|
2016-04-05 05:57:55 +05:30
|
|
|
}
|
2016-04-08 23:07:38 +05:30
|
|
|
return fileInfo, nil
|
2016-04-05 05:57:55 +05:30
|
|
|
}
|
|
|
|
|
2016-04-04 19:55:07 -07:00
|
|
|
var markerBase, markerDir string
|
2016-04-05 05:57:55 +05:30
|
|
|
if marker != "" {
|
2016-04-04 19:55:07 -07:00
|
|
|
// Ex: if marker="four/five.txt", markerDir="four/" markerBase="five.txt"
|
2016-04-05 05:57:55 +05:30
|
|
|
markerSplit := strings.SplitN(marker, string(os.PathSeparator), 2)
|
2016-04-04 19:55:07 -07:00
|
|
|
markerDir = markerSplit[0]
|
2016-04-05 05:57:55 +05:30
|
|
|
if len(markerSplit) == 2 {
|
2016-04-04 19:55:07 -07:00
|
|
|
markerDir += string(os.PathSeparator)
|
|
|
|
markerBase = markerSplit[1]
|
2016-04-05 05:57:55 +05:30
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-04-16 12:48:41 -07:00
|
|
|
// Entry prefix match function.
|
|
|
|
prefixMatchFn := func(dirent fsDirent) bool {
|
|
|
|
if dirent.IsDir() || dirent.IsRegular() {
|
|
|
|
// Does dirent name has reserved prefixes or suffixes.
|
|
|
|
hasReserved := hasReservedPrefix(dirent.name) || hasReservedSuffix(dirent.name)
|
|
|
|
// All dirents which match prefix and do not have reserved
|
|
|
|
// keywords in them are valid entries.
|
2016-04-16 19:33:29 -07:00
|
|
|
return strings.HasPrefix(dirent.name, entryPrefixMatch) && !hasReserved && isValidPath(dirent.name)
|
2016-04-16 12:48:41 -07:00
|
|
|
}
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
|
|
|
|
// scandir returns entries that begins with entryPrefixMatch
|
|
|
|
dirents, err := scandir(filepath.Join(bucketDir, prefixDir), prefixMatchFn, true)
|
2016-04-05 05:57:55 +05:30
|
|
|
if err != nil {
|
|
|
|
send(treeWalkResult{err: err})
|
|
|
|
return false
|
|
|
|
}
|
2016-04-16 12:48:41 -07:00
|
|
|
|
2016-04-05 05:57:55 +05:30
|
|
|
// example:
|
2016-04-04 19:55:07 -07:00
|
|
|
// If markerDir="four/" searchDirents() returns the index of "four/" in the sorted
|
2016-04-05 05:57:55 +05:30
|
|
|
// dirents list. We skip all the dirent entries till "four/"
|
2016-04-04 19:55:07 -07:00
|
|
|
dirents = dirents[searchDirents(dirents, markerDir):]
|
2016-04-05 05:57:55 +05:30
|
|
|
*count += len(dirents)
|
|
|
|
for i, dirent := range dirents {
|
2016-04-09 00:16:03 +05:30
|
|
|
if i == 0 && markerDir == dirent.name && !dirent.IsDir() {
|
2016-04-05 05:57:55 +05:30
|
|
|
// If the first entry is not a directory
|
|
|
|
// we need to skip this entry.
|
|
|
|
*count--
|
|
|
|
continue
|
|
|
|
}
|
2016-04-09 00:16:03 +05:30
|
|
|
if dirent.IsDir() && recursive {
|
2016-04-05 05:57:55 +05:30
|
|
|
// If the entry is a directory, we will need recurse into it.
|
|
|
|
markerArg := ""
|
2016-04-04 19:55:07 -07:00
|
|
|
if dirent.name == markerDir {
|
|
|
|
// We need to pass "five.txt" as marker only if we are
|
|
|
|
// recursing into "four/"
|
|
|
|
markerArg = markerBase
|
2016-04-05 05:57:55 +05:30
|
|
|
}
|
|
|
|
*count--
|
|
|
|
if !treeWalk(bucketDir, filepath.Join(prefixDir, dirent.name), "", markerArg, recursive, send, count) {
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
continue
|
|
|
|
}
|
2016-04-08 23:07:38 +05:30
|
|
|
fileInfo, err := direntToFileInfo(dirent)
|
2016-04-05 05:57:55 +05:30
|
|
|
if err != nil {
|
|
|
|
send(treeWalkResult{err: err})
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
*count--
|
2016-04-08 23:07:38 +05:30
|
|
|
if !send(treeWalkResult{fileInfo: fileInfo}) {
|
2016-04-05 05:57:55 +05:30
|
|
|
return false
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return true
|
|
|
|
}
|
|
|
|
|
|
|
|
// Initiate a new treeWalk in a goroutine.
|
2016-04-04 19:55:07 -07:00
|
|
|
func startTreeWalk(fsPath, bucket, prefix, marker string, recursive bool) *treeWalker {
|
2016-04-05 05:57:55 +05:30
|
|
|
// Example 1
|
|
|
|
// If prefix is "one/two/three/" and marker is "one/two/three/four/five.txt"
|
|
|
|
// treeWalk is called with prefixDir="one/two/three/" and marker="four/five.txt"
|
|
|
|
// and entryPrefixMatch=""
|
|
|
|
|
|
|
|
// Example 2
|
|
|
|
// if prefix is "one/two/th" and marker is "one/two/three/four/five.txt"
|
|
|
|
// treeWalk is called with prefixDir="one/two/" and marker="three/four/five.txt"
|
|
|
|
// and entryPrefixMatch="th"
|
2016-04-08 23:07:38 +05:30
|
|
|
ch := make(chan treeWalkResult, fsListLimit)
|
2016-04-04 19:55:07 -07:00
|
|
|
walkNotify := treeWalker{ch: ch}
|
2016-04-05 05:57:55 +05:30
|
|
|
entryPrefixMatch := prefix
|
|
|
|
prefixDir := ""
|
|
|
|
lastIndex := strings.LastIndex(prefix, string(os.PathSeparator))
|
|
|
|
if lastIndex != -1 {
|
|
|
|
entryPrefixMatch = prefix[lastIndex+1:]
|
|
|
|
prefixDir = prefix[:lastIndex+1]
|
|
|
|
}
|
|
|
|
count := 0
|
|
|
|
marker = strings.TrimPrefix(marker, prefixDir)
|
|
|
|
go func() {
|
|
|
|
defer close(ch)
|
|
|
|
send := func(walkResult treeWalkResult) bool {
|
|
|
|
if count == 0 {
|
|
|
|
walkResult.end = true
|
|
|
|
}
|
|
|
|
timer := time.After(time.Second * 60)
|
|
|
|
select {
|
|
|
|
case ch <- walkResult:
|
|
|
|
return true
|
|
|
|
case <-timer:
|
2016-04-04 19:55:07 -07:00
|
|
|
walkNotify.timedOut = true
|
2016-04-05 05:57:55 +05:30
|
|
|
return false
|
|
|
|
}
|
|
|
|
}
|
2016-04-08 17:13:16 -07:00
|
|
|
bucketDir := filepath.Join(fsPath, bucket)
|
|
|
|
treeWalk(bucketDir, prefixDir, entryPrefixMatch, marker, recursive, send, &count)
|
2016-04-05 05:57:55 +05:30
|
|
|
}()
|
2016-04-04 19:55:07 -07:00
|
|
|
return &walkNotify
|
2016-04-05 05:57:55 +05:30
|
|
|
}
|