mirror of
https://github.com/minio/minio.git
synced 2024-12-26 23:25:54 -05:00
ad8e611098
Spark/Hadoop workloads which use the Hadoop MR Committer v1/v2 algorithm upload
objects to a temporary prefix in a bucket. These objects are 'renamed' to a
different prefix on job commit. Object storage admins are forced to configure
separate ILM policies to expire these objects and their versions to reclaim
space.

Our solution:

This can be avoided by simply marking objects under these prefixes to be
excluded from versioning, as shown below. Consequently, these objects are
excluded from replication, and don't require ILM policies to prune unnecessary
versions.

- MinIO Extension to Bucket Version Configuration

```xml
<VersioningConfiguration xmlns="http://s3.amazonaws.com/doc/2006-03-01/">
  <Status>Enabled</Status>
  <ExcludeFolders>true</ExcludeFolders>
  <ExcludedPrefixes>
    <Prefix>app1-jobs/*/_temporary/</Prefix>
  </ExcludedPrefixes>
  <ExcludedPrefixes>
    <Prefix>app2-jobs/*/__magic/</Prefix>
  </ExcludedPrefixes>
  <!-- .. up to 10 prefixes in all -->
</VersioningConfiguration>
```

Note: `ExcludeFolders` excludes all folders in a bucket from versioning. This is
required to prevent the parent folders from accumulating delete markers,
especially those which are shared across Spark workloads spanning
projects/teams.

- To enable version exclusion on a list of prefixes

```
mc version enable --excluded-prefixes "app1-jobs/*/_temporary/,app2-jobs/*/__magic/" --exclude-prefix-marker myminio/test
```
79 lines
2.5 KiB
Go
79 lines
2.5 KiB
Go
// Copyright (c) 2015-2021 MinIO, Inc.
|
|
//
|
|
// This file is part of MinIO Object Storage stack
|
|
//
|
|
// This program is free software: you can redistribute it and/or modify
|
|
// it under the terms of the GNU Affero General Public License as published by
|
|
// the Free Software Foundation, either version 3 of the License, or
|
|
// (at your option) any later version.
|
|
//
|
|
// This program is distributed in the hope that it will be useful
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
// GNU Affero General Public License for more details.
|
|
//
|
|
// You should have received a copy of the GNU Affero General Public License
|
|
// along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
package cmd
|
|
|
|
import "github.com/minio/minio/internal/bucket/versioning"
|
|
|
|
// BucketVersioningSys is the bucket versioning subsystem. It carries no
// fields of its own; its methods look up each bucket's versioning
// configuration through the global bucket metadata system.
type BucketVersioningSys struct{}
|
|
|
|
// Enabled enabled versioning?
|
|
func (sys *BucketVersioningSys) Enabled(bucket string) bool {
|
|
vc, err := globalBucketMetadataSys.GetVersioningConfig(bucket)
|
|
if err != nil {
|
|
return false
|
|
}
|
|
return vc.Enabled()
|
|
}
|
|
|
|
// PrefixEnabled returns true is versioning is enabled at bucket level and if
|
|
// the given prefix doesn't match any excluded prefixes pattern. This is
|
|
// part of a MinIO versioning configuration extension.
|
|
func (sys *BucketVersioningSys) PrefixEnabled(bucket, prefix string) bool {
|
|
vc, err := globalBucketMetadataSys.GetVersioningConfig(bucket)
|
|
if err != nil {
|
|
return false
|
|
}
|
|
return vc.PrefixEnabled(prefix)
|
|
}
|
|
|
|
// Suspended suspended versioning?
|
|
func (sys *BucketVersioningSys) Suspended(bucket string) bool {
|
|
vc, err := globalBucketMetadataSys.GetVersioningConfig(bucket)
|
|
if err != nil {
|
|
return false
|
|
}
|
|
return vc.Suspended()
|
|
}
|
|
|
|
// PrefixSuspended returns true if the given prefix matches an excluded prefix
|
|
// pattern. This is part of a MinIO versioning configuration extension.
|
|
func (sys *BucketVersioningSys) PrefixSuspended(bucket, prefix string) bool {
|
|
vc, err := globalBucketMetadataSys.GetVersioningConfig(bucket)
|
|
if err != nil {
|
|
return false
|
|
}
|
|
|
|
return vc.PrefixSuspended(prefix)
|
|
}
|
|
|
|
// Get returns stored bucket policy
|
|
func (sys *BucketVersioningSys) Get(bucket string) (*versioning.Versioning, error) {
|
|
return globalBucketMetadataSys.GetVersioningConfig(bucket)
|
|
}
|
|
|
|
// Reset BucketVersioningSys to initial state.
|
|
func (sys *BucketVersioningSys) Reset() {
|
|
// There is currently no internal state.
|
|
}
|
|
|
|
// NewBucketVersioningSys - creates new versioning system.
|
|
func NewBucketVersioningSys() *BucketVersioningSys {
|
|
return &BucketVersioningSys{}
|
|
}
|