mirror of
https://github.com/minio/minio.git
synced 2025-01-12 15:33:22 -05:00
490c30f853
Just like our single directory/disk setup, this PR brings the functionality to cleanup stale multipart objects older > 2 weeks.
263 lines
7.8 KiB
Go
263 lines
7.8 KiB
Go
/*
|
|
* Minio Cloud Storage, (C) 2016, 2017 Minio, Inc.
|
|
*
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
* you may not use this file except in compliance with the License.
|
|
* You may obtain a copy of the License at
|
|
*
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
*
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
* See the License for the specific language governing permissions and
|
|
* limitations under the License.
|
|
*/
|
|
|
|
package cmd
|
|
|
|
import (
|
|
"encoding/json"
|
|
"io"
|
|
"io/ioutil"
|
|
"path"
|
|
"sort"
|
|
"time"
|
|
|
|
"github.com/minio/minio/pkg/errors"
|
|
"github.com/minio/minio/pkg/lock"
|
|
)
|
|
|
|
const (
|
|
// Expiry duration after which the multipart uploads are deemed stale.
|
|
multipartExpiry = time.Hour * 24 * 14 // 2 weeks.
|
|
// Cleanup interval when the stale multipart cleanup is initiated.
|
|
multipartCleanupInterval = time.Hour * 24 // 24 hrs.
|
|
)
|
|
|
|
// A uploadInfo represents the s3 compatible spec.
|
|
type uploadInfo struct {
|
|
UploadID string `json:"uploadId"` // UploadID for the active multipart upload.
|
|
Deleted bool `json:"deleted"` // Currently unused, for future use.
|
|
Initiated time.Time `json:"initiated"` // Indicates when the uploadID was initiated.
|
|
}
|
|
|
|
// A uploadsV1 represents `uploads.json` metadata header.
|
|
type uploadsV1 struct {
|
|
Version string `json:"version"` // Version of the current `uploads.json`
|
|
Format string `json:"format"` // Format of the current `uploads.json`
|
|
Uploads []uploadInfo `json:"uploadIds"` // Captures all the upload ids for a given object.
|
|
}
|
|
|
|
// byInitiatedTime is a collection satisfying sort.Interface.
|
|
type byInitiatedTime []uploadInfo
|
|
|
|
func (t byInitiatedTime) Len() int { return len(t) }
|
|
func (t byInitiatedTime) Swap(i, j int) { t[i], t[j] = t[j], t[i] }
|
|
func (t byInitiatedTime) Less(i, j int) bool {
|
|
return t[i].Initiated.Before(t[j].Initiated)
|
|
}
|
|
|
|
// AddUploadID - adds a new upload id in order of its initiated time.
|
|
func (u *uploadsV1) AddUploadID(uploadID string, initiated time.Time) {
|
|
u.Uploads = append(u.Uploads, uploadInfo{
|
|
UploadID: uploadID,
|
|
Initiated: initiated,
|
|
})
|
|
sort.Sort(byInitiatedTime(u.Uploads))
|
|
}
|
|
|
|
// RemoveUploadID - removes upload id from uploads metadata.
|
|
func (u *uploadsV1) RemoveUploadID(uploadID string) {
|
|
// If the uploadID is absent, we do nothing.
|
|
for i, uInfo := range u.Uploads {
|
|
if uInfo.UploadID == uploadID {
|
|
u.Uploads = append(u.Uploads[:i], u.Uploads[i+1:]...)
|
|
break
|
|
}
|
|
}
|
|
}
|
|
|
|
// IsEmpty - is true if no more uploads available.
|
|
func (u *uploadsV1) IsEmpty() bool {
|
|
return len(u.Uploads) == 0
|
|
}
|
|
|
|
func (u *uploadsV1) WriteTo(lk *lock.LockedFile) (n int64, err error) {
|
|
// Serialize to prepare to write to disk.
|
|
var uplBytes []byte
|
|
uplBytes, err = json.Marshal(u)
|
|
if err != nil {
|
|
return 0, errors.Trace(err)
|
|
}
|
|
if err = lk.Truncate(0); err != nil {
|
|
return 0, errors.Trace(err)
|
|
}
|
|
_, err = lk.Write(uplBytes)
|
|
if err != nil {
|
|
return 0, errors.Trace(err)
|
|
}
|
|
return int64(len(uplBytes)), nil
|
|
}
|
|
|
|
func (u *uploadsV1) ReadFrom(lk *lock.LockedFile) (n int64, err error) {
|
|
var uploadIDBytes []byte
|
|
fi, err := lk.Stat()
|
|
if err != nil {
|
|
return 0, errors.Trace(err)
|
|
}
|
|
uploadIDBytes, err = ioutil.ReadAll(io.NewSectionReader(lk, 0, fi.Size()))
|
|
if err != nil {
|
|
return 0, errors.Trace(err)
|
|
}
|
|
if len(uploadIDBytes) == 0 {
|
|
return 0, errors.Trace(io.EOF)
|
|
}
|
|
// Decode `uploads.json`.
|
|
if err = json.Unmarshal(uploadIDBytes, u); err != nil {
|
|
return 0, errors.Trace(err)
|
|
}
|
|
return int64(len(uploadIDBytes)), nil
|
|
}
|
|
|
|
// readUploadsJSON - get all the saved uploads JSON.
|
|
func readUploadsJSON(bucket, object string, disk StorageAPI) (uploadIDs uploadsV1, err error) {
|
|
uploadJSONPath := path.Join(bucket, object, uploadsJSONFile)
|
|
// Reads entire `uploads.json`.
|
|
buf, err := disk.ReadAll(minioMetaMultipartBucket, uploadJSONPath)
|
|
if err != nil {
|
|
return uploadsV1{}, errors.Trace(err)
|
|
}
|
|
|
|
// Decode `uploads.json`.
|
|
if err = json.Unmarshal(buf, &uploadIDs); err != nil {
|
|
return uploadsV1{}, errors.Trace(err)
|
|
}
|
|
|
|
// Success.
|
|
return uploadIDs, nil
|
|
}
|
|
|
|
// newUploadsV1 - initialize new uploads v1.
|
|
func newUploadsV1(format string) uploadsV1 {
|
|
uploadIDs := uploadsV1{}
|
|
uploadIDs.Version = "1.0.0" // Should follow semantic versioning.
|
|
uploadIDs.Format = format
|
|
return uploadIDs
|
|
}
|
|
|
|
func writeUploadJSON(u *uploadsV1, uploadsPath, tmpPath string, disk StorageAPI) error {
|
|
// Serialize to prepare to write to disk.
|
|
uplBytes, wErr := json.Marshal(&u)
|
|
if wErr != nil {
|
|
return errors.Trace(wErr)
|
|
}
|
|
|
|
// Write `uploads.json` to disk. First to tmp location and then rename.
|
|
if wErr = disk.AppendFile(minioMetaTmpBucket, tmpPath, uplBytes); wErr != nil {
|
|
return errors.Trace(wErr)
|
|
}
|
|
wErr = disk.RenameFile(minioMetaTmpBucket, tmpPath, minioMetaMultipartBucket, uploadsPath)
|
|
if wErr != nil {
|
|
if dErr := disk.DeleteFile(minioMetaTmpBucket, tmpPath); dErr != nil {
|
|
// we return the most recent error.
|
|
return errors.Trace(dErr)
|
|
}
|
|
return errors.Trace(wErr)
|
|
}
|
|
return nil
|
|
}
|
|
|
|
// listMultipartUploadIDs - list all the upload ids from a marker up to 'count'.
|
|
func listMultipartUploadIDs(bucketName, objectName, uploadIDMarker string, count int, disk StorageAPI) ([]MultipartInfo, bool, error) {
|
|
var uploads []MultipartInfo
|
|
// Read `uploads.json`.
|
|
uploadsJSON, err := readUploadsJSON(bucketName, objectName, disk)
|
|
if err != nil {
|
|
switch errors.Cause(err) {
|
|
case errFileNotFound, errFileAccessDenied:
|
|
return nil, true, nil
|
|
}
|
|
return nil, false, err
|
|
}
|
|
index := 0
|
|
if uploadIDMarker != "" {
|
|
for ; index < len(uploadsJSON.Uploads); index++ {
|
|
if uploadsJSON.Uploads[index].UploadID == uploadIDMarker {
|
|
// Skip the uploadID as it would already be listed in previous listing.
|
|
index++
|
|
break
|
|
}
|
|
}
|
|
}
|
|
for index < len(uploadsJSON.Uploads) {
|
|
uploads = append(uploads, MultipartInfo{
|
|
Object: objectName,
|
|
UploadID: uploadsJSON.Uploads[index].UploadID,
|
|
Initiated: uploadsJSON.Uploads[index].Initiated,
|
|
})
|
|
count--
|
|
index++
|
|
if count == 0 {
|
|
break
|
|
}
|
|
}
|
|
end := (index == len(uploadsJSON.Uploads))
|
|
return uploads, end, nil
|
|
}
|
|
|
|
// List multipart uploads func defines the function signature of list multipart recursive function.
|
|
type listMultipartUploadsFunc func(bucket, prefix, keyMarker, uploadIDMarker, delimiter string, maxUploads int) (ListMultipartsInfo, error)
|
|
|
|
// Removes multipart uploads if any older than `expiry` duration
|
|
// on all buckets for every `cleanupInterval`, this function is
|
|
// blocking and should be run in a go-routine.
|
|
func cleanupStaleMultipartUploads(cleanupInterval, expiry time.Duration, obj ObjectLayer, listFn listMultipartUploadsFunc, doneCh chan struct{}) {
|
|
ticker := time.NewTicker(cleanupInterval)
|
|
for {
|
|
select {
|
|
case <-doneCh:
|
|
// Stop the timer.
|
|
ticker.Stop()
|
|
return
|
|
case <-ticker.C:
|
|
bucketInfos, err := obj.ListBuckets()
|
|
if err != nil {
|
|
errorIf(err, "Unable to list buckets")
|
|
continue
|
|
}
|
|
for _, bucketInfo := range bucketInfos {
|
|
cleanupStaleMultipartUpload(bucketInfo.Name, expiry, obj, listFn)
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
// Removes multipart uploads if any older than `expiry` duration in a given bucket.
|
|
func cleanupStaleMultipartUpload(bucket string, expiry time.Duration, obj ObjectLayer, listFn listMultipartUploadsFunc) (err error) {
|
|
var lmi ListMultipartsInfo
|
|
for {
|
|
// List multipart uploads in a bucket 1000 at a time
|
|
prefix := ""
|
|
lmi, err = listFn(bucket, prefix, lmi.KeyMarker, lmi.UploadIDMarker, "", 1000)
|
|
if err != nil {
|
|
errorIf(err, "Unable to list uploads")
|
|
return err
|
|
}
|
|
|
|
// Remove uploads (and its parts) older than expiry duration.
|
|
for _, upload := range lmi.Uploads {
|
|
if time.Since(upload.Initiated) > expiry {
|
|
obj.AbortMultipartUpload(bucket, upload.Object, upload.UploadID)
|
|
}
|
|
}
|
|
|
|
// No more incomplete uploads remain, break and return.
|
|
if !lmi.IsTruncated {
|
|
break
|
|
}
|
|
}
|
|
|
|
return nil
|
|
}
|