2016-05-04 15:18:20 -04:00
/ *
2019-04-09 14:39:42 -04:00
* MinIO Cloud Storage , ( C ) 2016 , 2017 , 2018 MinIO , Inc .
2016-05-04 15:18:20 -04:00
*
* Licensed under the Apache License , Version 2.0 ( the "License" ) ;
* you may not use this file except in compliance with the License .
* You may obtain a copy of the License at
*
* http : //www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing , software
* distributed under the License is distributed on an "AS IS" BASIS ,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND , either express or implied .
* See the License for the specific language governing permissions and
* limitations under the License .
* /
2016-08-18 19:23:42 -04:00
package cmd
2016-05-04 15:18:20 -04:00
2016-05-07 03:59:43 -04:00
import (
2019-09-24 21:47:26 -04:00
"bytes"
2018-04-05 18:04:40 -04:00
"context"
2020-01-13 16:09:10 -05:00
"encoding/hex"
2016-05-07 03:59:43 -04:00
"encoding/json"
"fmt"
2018-02-15 20:45:57 -05:00
"io/ioutil"
2018-07-18 23:17:35 -04:00
"reflect"
2020-01-13 16:09:10 -05:00
"sync"
2018-02-15 20:45:57 -05:00
2018-02-20 21:42:09 -05:00
humanize "github.com/dustin/go-humanize"
2020-05-26 12:32:33 -04:00
"github.com/minio/minio/cmd/config"
2020-01-13 16:09:10 -05:00
"github.com/minio/minio/cmd/config/storageclass"
2018-07-18 23:17:35 -04:00
"github.com/minio/minio/cmd/logger"
2020-01-13 16:09:10 -05:00
"github.com/minio/minio/pkg/color"
2019-10-14 12:44:51 -04:00
"github.com/minio/minio/pkg/sync/errgroup"
2018-02-20 21:42:09 -05:00
sha256 "github.com/minio/sha256-simd"
2017-06-12 20:40:28 -04:00
)
const (
// Represents XL backend.
formatBackendXL = "xl"
2018-02-15 20:45:57 -05:00
// formatXLV1.XL.Version - version '1'.
2018-01-08 17:30:55 -05:00
formatXLVersionV1 = "1"
2018-02-15 20:45:57 -05:00
// formatXLV2.XL.Version - version '2'.
formatXLVersionV2 = "2"
2018-03-15 16:55:23 -04:00
// formatXLV3.XL.Version - version '3'.
formatXLVersionV3 = "3"
2018-02-15 20:45:57 -05:00
// Distribution algorithm used.
formatXLVersionV2DistributionAlgo = "CRCMOD"
2018-01-08 17:30:55 -05:00
)
2017-06-12 20:40:28 -04:00
2018-02-15 20:45:57 -05:00
// Offline disk UUID represents an offline disk.
const offlineDiskUUID = "ffffffff-ffff-ffff-ffff-ffffffffffff"
// Healing is only supported for the list of errors mentioned here.
var formatHealErrors = map [ error ] struct { } {
errUnformattedDisk : { } ,
errDiskNotFound : { } ,
}
// List of errors considered critical for disk formatting.
var formatCriticalErrors = map [ error ] struct { } {
errCorruptedFormat : { } ,
errFaultyDisk : { } ,
}
// Used to detect the version of "xl" format.
type formatXLVersionDetect struct {
XL struct {
Version string ` json:"version" `
} ` json:"xl" `
}
// Represents the V1 backend disk structure version
// under `.minio.sys` and actual data namespace.
2018-01-08 17:30:55 -05:00
// formatXLV1 - structure holds format config version '1'.
type formatXLV1 struct {
formatMetaV1
XL struct {
Version string ` json:"version" ` // Version of 'xl' format.
Disk string ` json:"disk" ` // Disk field carries assigned disk uuid.
// JBOD field carries the input disk order generated the first
// time when fresh disks were supplied.
JBOD [ ] string ` json:"jbod" `
} ` json:"xl" ` // XL field holds xl format.
2017-06-12 20:40:28 -04:00
}
2018-02-15 20:45:57 -05:00
// Represents the V2 backend disk structure version
// under `.minio.sys` and actual data namespace.
// formatXLV2 - structure holds format config version '2'.
2018-07-16 23:26:42 -04:00
// The V2 format to support "large bucket" support where a bucket
// can span multiple erasure sets.
2018-02-15 20:45:57 -05:00
type formatXLV2 struct {
2018-07-16 23:26:42 -04:00
formatMetaV1
XL struct {
2018-02-15 20:45:57 -05:00
Version string ` json:"version" ` // Version of 'xl' format.
This string ` json:"this" ` // This field carries assigned disk uuid.
// Sets field carries the input disk order generated the first
// time when fresh disks were supplied, it is a two dimensional
// array second dimension represents list of disks used per set.
Sets [ ] [ ] string ` json:"sets" `
// Distribution algorithm represents the hashing algorithm
// to pick the right set index for an object.
DistributionAlgo string ` json:"distributionAlgo" `
} ` json:"xl" `
}
2018-03-15 16:55:23 -04:00
// formatXLV3 struct is same as formatXLV2 struct except that formatXLV3.XL.Version is "3" indicating
// the simplified multipart backend which is a flat hierarchy now.
// In .minio.sys/multipart we have:
// sha256(bucket/object)/uploadID/[xl.json, part.1, part.2 ....]
type formatXLV3 struct {
2018-07-16 23:26:42 -04:00
formatMetaV1
XL struct {
2018-03-15 16:55:23 -04:00
Version string ` json:"version" ` // Version of 'xl' format.
This string ` json:"this" ` // This field carries assigned disk uuid.
// Sets field carries the input disk order generated the first
// time when fresh disks were supplied, it is a two dimensional
// array second dimension represents list of disks used per set.
Sets [ ] [ ] string ` json:"sets" `
// Distribution algorithm represents the hashing algorithm
// to pick the right set index for an object.
DistributionAlgo string ` json:"distributionAlgo" `
} ` json:"xl" `
}
2019-11-21 07:24:51 -05:00
func ( f * formatXLV3 ) Clone ( ) * formatXLV3 {
b , err := json . Marshal ( f )
if err != nil {
panic ( err )
}
var dst formatXLV3
if err = json . Unmarshal ( b , & dst ) ; err != nil {
panic ( err )
}
return & dst
}
2018-02-15 20:45:57 -05:00
// Returns formatXL.XL.Version
2018-03-15 16:55:23 -04:00
func newFormatXLV3 ( numSets int , setLen int ) * formatXLV3 {
format := & formatXLV3 { }
2018-02-15 20:45:57 -05:00
format . Version = formatMetaVersionV1
format . Format = formatBackendXL
2018-07-18 23:17:35 -04:00
format . ID = mustGetUUID ( )
2018-03-15 16:55:23 -04:00
format . XL . Version = formatXLVersionV3
2018-02-15 20:45:57 -05:00
format . XL . DistributionAlgo = formatXLVersionV2DistributionAlgo
format . XL . Sets = make ( [ ] [ ] string , numSets )
for i := 0 ; i < numSets ; i ++ {
format . XL . Sets [ i ] = make ( [ ] string , setLen )
for j := 0 ; j < setLen ; j ++ {
format . XL . Sets [ i ] [ j ] = mustGetUUID ( )
}
}
return format
}
2019-12-23 19:31:03 -05:00
// Returns format XL version after reading `format.json`, returns
// successfully the version only if the backend is XL.
func formatGetBackendXLVersion ( formatPath string ) ( string , error ) {
2018-02-15 20:45:57 -05:00
meta := & formatMetaV1 { }
b , err := ioutil . ReadFile ( formatPath )
if err != nil {
return "" , err
}
if err = json . Unmarshal ( b , meta ) ; err != nil {
return "" , err
}
if meta . Version != formatMetaVersionV1 {
return "" , fmt . Errorf ( ` format.Version expected: %s, got: %s ` , formatMetaVersionV1 , meta . Version )
}
2019-12-23 19:31:03 -05:00
if meta . Format != formatBackendXL {
return "" , fmt . Errorf ( ` found backend %s, expected %s ` , meta . Format , formatBackendXL )
}
// XL backend found, proceed to detect version.
format := & formatXLVersionDetect { }
if err = json . Unmarshal ( b , format ) ; err != nil {
return "" , err
}
return format . XL . Version , nil
2018-02-15 20:45:57 -05:00
}
// Migrates all previous versions to latest version of `format.json`,
// this code calls migration in sequence, such as V1 is migrated to V2
// first before it V2 migrates to V3.
func formatXLMigrate ( export string ) error {
formatPath := pathJoin ( export , minioMetaBucket , formatConfigFile )
2019-12-23 19:31:03 -05:00
version , err := formatGetBackendXLVersion ( formatPath )
2018-02-15 20:45:57 -05:00
if err != nil {
return err
}
switch version {
case formatXLVersionV1 :
2019-12-23 19:31:03 -05:00
if err = formatXLMigrateV1ToV2 ( export , version ) ; err != nil {
2018-02-15 20:45:57 -05:00
return err
}
2019-12-23 19:31:03 -05:00
// Migrate successful v1 => v2, proceed to v2 => v3
version = formatXLVersionV2
2018-02-15 20:45:57 -05:00
fallthrough
case formatXLVersionV2 :
2019-12-23 19:31:03 -05:00
if err = formatXLMigrateV2ToV3 ( export , version ) ; err != nil {
2018-03-15 16:55:23 -04:00
return err
}
2019-12-23 19:31:03 -05:00
// Migrate successful v2 => v3, v3 is latest
2020-05-18 12:59:45 -04:00
// version = formatXLVersionV3
2018-03-15 16:55:23 -04:00
fallthrough
case formatXLVersionV3 :
2019-12-23 19:31:03 -05:00
// v3 is the latest version, return.
2018-02-15 20:45:57 -05:00
return nil
}
return fmt . Errorf ( ` %s: unknown format version %s ` , export , version )
}
// Migrates version V1 of format.json to version V2 of format.json,
// migration fails upon any error.
2019-12-23 19:31:03 -05:00
func formatXLMigrateV1ToV2 ( export , version string ) error {
2018-02-15 20:45:57 -05:00
if version != formatXLVersionV1 {
return fmt . Errorf ( ` Disk %s: format version expected %s, found %s ` , export , formatXLVersionV1 , version )
}
2019-12-23 19:31:03 -05:00
formatPath := pathJoin ( export , minioMetaBucket , formatConfigFile )
2018-02-15 20:45:57 -05:00
formatV1 := & formatXLV1 { }
b , err := ioutil . ReadFile ( formatPath )
if err != nil {
return err
}
if err = json . Unmarshal ( b , formatV1 ) ; err != nil {
return err
}
2016-06-02 19:34:15 -04:00
2018-03-15 16:55:23 -04:00
formatV2 := & formatXLV2 { }
formatV2 . Version = formatMetaVersionV1
formatV2 . Format = formatBackendXL
formatV2 . XL . Version = formatXLVersionV2
formatV2 . XL . DistributionAlgo = formatXLVersionV2DistributionAlgo
2018-03-19 12:13:00 -04:00
formatV2 . XL . This = formatV1 . XL . Disk
2018-03-15 16:55:23 -04:00
formatV2 . XL . Sets = make ( [ ] [ ] string , 1 )
formatV2 . XL . Sets [ 0 ] = make ( [ ] string , len ( formatV1 . XL . JBOD ) )
2018-02-15 20:45:57 -05:00
copy ( formatV2 . XL . Sets [ 0 ] , formatV1 . XL . JBOD )
b , err = json . Marshal ( formatV2 )
if err != nil {
return err
}
return ioutil . WriteFile ( formatPath , b , 0644 )
}
2017-08-03 07:37:02 -04:00
2018-03-15 16:55:23 -04:00
// Migrates V2 for format.json to V3 (Flat hierarchy for multipart)
2019-12-23 19:31:03 -05:00
func formatXLMigrateV2ToV3 ( export , version string ) error {
2018-03-15 16:55:23 -04:00
if version != formatXLVersionV2 {
return fmt . Errorf ( ` Disk %s: format version expected %s, found %s ` , export , formatXLVersionV2 , version )
}
2019-12-23 19:31:03 -05:00
formatPath := pathJoin ( export , minioMetaBucket , formatConfigFile )
2018-03-15 16:55:23 -04:00
formatV2 := & formatXLV2 { }
b , err := ioutil . ReadFile ( formatPath )
if err != nil {
return err
}
err = json . Unmarshal ( b , formatV2 )
if err != nil {
return err
}
2018-08-06 00:15:28 -04:00
if err = removeAll ( pathJoin ( export , minioMetaMultipartBucket ) ) ; err != nil {
2018-03-15 16:55:23 -04:00
return err
}
2018-08-06 00:15:28 -04:00
if err = mkdirAll ( pathJoin ( export , minioMetaMultipartBucket ) , 0755 ) ; err != nil {
2018-03-15 16:55:23 -04:00
return err
}
// format-V2 struct is exactly same as format-V1 except that version is "3"
// which indicates the simplified multipart backend.
formatV3 := formatXLV3 { }
formatV3 . Version = formatV2 . Version
formatV3 . Format = formatV2 . Format
formatV3 . XL = formatV2 . XL
formatV3 . XL . Version = formatXLVersionV3
b , err = json . Marshal ( formatV3 )
if err != nil {
return err
}
return ioutil . WriteFile ( formatPath , b , 0644 )
}
2018-02-15 20:45:57 -05:00
// countErrs - count a specific error.
func countErrs ( errs [ ] error , err error ) int {
var i = 0
for _ , err1 := range errs {
2018-04-10 12:36:37 -04:00
if err1 == err {
2018-02-15 20:45:57 -05:00
i ++
}
}
return i
2016-06-02 19:34:15 -04:00
}
2018-02-15 20:45:57 -05:00
// Does all errors indicate we need to initialize all disks?.
func shouldInitXLDisks ( errs [ ] error ) bool {
return countErrs ( errs , errUnformattedDisk ) == len ( errs )
}
2018-04-12 18:43:38 -04:00
// Check if unformatted disks are equal to write quorum.
func quorumUnformattedDisks ( errs [ ] error ) bool {
return countErrs ( errs , errUnformattedDisk ) >= ( len ( errs ) / 2 ) + 1
}
2018-02-15 20:45:57 -05:00
// loadFormatXLAll - load all format config from all input disks in parallel.
2020-03-27 17:48:30 -04:00
func loadFormatXLAll ( storageDisks [ ] StorageAPI , heal bool ) ( [ ] * formatXLV3 , [ ] error ) {
2016-06-02 19:34:15 -04:00
// Initialize list of errors.
2019-10-14 12:44:51 -04:00
g := errgroup . WithNErrs ( len ( storageDisks ) )
2016-06-02 19:34:15 -04:00
// Initialize format configs.
2018-04-04 00:58:48 -04:00
var formats = make ( [ ] * formatXLV3 , len ( storageDisks ) )
2016-06-02 19:34:15 -04:00
2018-01-22 17:54:55 -05:00
// Load format from each disk in parallel
2019-10-14 12:44:51 -04:00
for index := range storageDisks {
index := index
g . Go ( func ( ) error {
if storageDisks [ index ] == nil {
return errDiskNotFound
}
format , err := loadFormatXL ( storageDisks [ index ] )
if err != nil {
return err
2016-06-02 19:34:15 -04:00
}
2018-01-08 17:30:55 -05:00
formats [ index ] = format
2020-03-27 17:48:30 -04:00
if ! heal {
// If no healing required, make the disks valid and
// online.
storageDisks [ index ] . SetDiskID ( format . XL . This )
}
2019-10-14 12:44:51 -04:00
return nil
} , index )
2016-06-02 19:34:15 -04:00
}
2019-10-14 12:44:51 -04:00
// Return all formats and errors if any.
return formats , g . Wait ( )
2016-06-02 19:34:15 -04:00
}
2020-03-27 17:48:30 -04:00
func saveFormatXL ( disk StorageAPI , format interface { } , diskID string ) error {
if format == nil || disk == nil {
return errDiskNotFound
}
if err := makeFormatXLMetaVolumes ( disk ) ; err != nil {
return err
}
2018-02-15 20:45:57 -05:00
// Marshal and write to disk.
formatBytes , err := json . Marshal ( format )
if err != nil {
return err
2017-08-03 07:37:02 -04:00
}
2019-12-23 19:31:03 -05:00
tmpFormat := mustGetUUID ( )
2019-09-24 21:47:26 -04:00
2018-02-15 20:45:57 -05:00
// Purge any existing temporary file, okay to ignore errors here.
2019-12-23 19:31:03 -05:00
defer disk . DeleteFile ( minioMetaBucket , tmpFormat )
2017-08-03 07:37:02 -04:00
2019-12-23 19:31:03 -05:00
// write to unique file.
if err = disk . WriteAll ( minioMetaBucket , tmpFormat , bytes . NewReader ( formatBytes ) ) ; err != nil {
2018-02-15 20:45:57 -05:00
return err
2017-08-03 07:37:02 -04:00
}
2019-09-24 21:47:26 -04:00
// Rename file `uuid.json` --> `format.json`.
2020-03-27 17:48:30 -04:00
if err = disk . RenameFile ( minioMetaBucket , tmpFormat , minioMetaBucket , formatConfigFile ) ; err != nil {
return err
}
disk . SetDiskID ( diskID )
return nil
2016-05-20 05:22:22 -04:00
}
2020-04-06 19:51:18 -04:00
var ignoredHiddenDirectories = map [ string ] struct { } {
2020-05-26 12:32:33 -04:00
minioMetaBucket : { } , // metabucket '.minio.sys'
".minio" : { } , // users may choose to double down the backend as the config folder for certs
".snapshot" : { } , // .snapshot for ignoring NetApp based persistent volumes WAFL snapshot
"lost+found" : { } , // 'lost+found' directory default on ext4 filesystems
"$RECYCLE.BIN" : { } , // windows specific directory for each drive (hidden)
"System Volume Information" : { } , // windows specific directory for each drive (hidden)
2018-11-02 14:31:55 -04:00
}
2020-04-06 19:51:18 -04:00
func isHiddenDirectories ( vols ... VolInfo ) bool {
for _ , vol := range vols {
if _ , ok := ignoredHiddenDirectories [ vol . Name ] ; ok {
continue
2018-11-02 14:31:55 -04:00
}
2020-04-06 19:51:18 -04:00
return false
2018-11-02 14:31:55 -04:00
}
2020-04-06 19:51:18 -04:00
return true
2018-11-02 14:31:55 -04:00
}
2018-02-15 20:45:57 -05:00
// loadFormatXL - loads format.json from disk.
2018-03-15 16:55:23 -04:00
func loadFormatXL ( disk StorageAPI ) ( format * formatXLV3 , err error ) {
2016-06-25 17:51:06 -04:00
buf , err := disk . ReadAll ( minioMetaBucket , formatConfigFile )
if err != nil {
2016-05-20 05:22:22 -04:00
// 'file not found' and 'volume not found' as
// same. 'volume not found' usually means its a fresh disk.
if err == errFileNotFound || err == errVolumeNotFound {
var vols [ ] VolInfo
vols , err = disk . ListVols ( )
if err != nil {
return nil , err
}
2020-04-06 19:51:18 -04:00
if ! isHiddenDirectories ( vols ... ) {
// 'format.json' not found, but we found user data, reject such disks.
2016-05-20 05:22:22 -04:00
return nil , errCorruptedFormat
}
// No other data found, its a fresh disk.
return nil , errUnformattedDisk
}
2016-05-07 03:59:43 -04:00
return nil , err
2016-05-04 15:18:20 -04:00
}
2016-06-24 05:06:23 -04:00
// Try to decode format json into formatConfigV1 struct.
2018-03-15 16:55:23 -04:00
format = & formatXLV3 { }
2016-06-25 17:51:06 -04:00
if err = json . Unmarshal ( buf , format ) ; err != nil {
2016-05-07 03:59:43 -04:00
return nil , err
2016-05-04 15:18:20 -04:00
}
2016-06-24 05:06:23 -04:00
// Success.
2016-05-20 05:22:22 -04:00
return format , nil
}
2018-02-15 20:45:57 -05:00
// Valid formatXL basic versions.
2018-03-15 16:55:23 -04:00
func checkFormatXLValue ( formatXL * formatXLV3 ) error {
2018-02-15 20:45:57 -05:00
// Validate format version and format type.
if formatXL . Version != formatMetaVersionV1 {
return fmt . Errorf ( "Unsupported version of backend format [%s] found" , formatXL . Version )
2016-07-26 06:18:47 -04:00
}
2018-02-15 20:45:57 -05:00
if formatXL . Format != formatBackendXL {
return fmt . Errorf ( "Unsupported backend format [%s] found" , formatXL . Format )
2017-08-03 07:37:02 -04:00
}
2018-03-15 16:55:23 -04:00
if formatXL . XL . Version != formatXLVersionV3 {
2018-02-15 20:45:57 -05:00
return fmt . Errorf ( "Unsupported XL backend format found [%s]" , formatXL . XL . Version )
2018-01-22 17:54:55 -05:00
}
return nil
2017-08-03 07:37:02 -04:00
}
2018-02-15 20:45:57 -05:00
// Check all format values.
2020-03-08 16:30:25 -04:00
func checkFormatXLValues ( formats [ ] * formatXLV3 , drivesPerSet int ) error {
2018-02-20 21:42:09 -05:00
for i , formatXL := range formats {
2018-02-15 20:45:57 -05:00
if formatXL == nil {
continue
}
if err := checkFormatXLValue ( formatXL ) ; err != nil {
return err
}
if len ( formats ) != len ( formatXL . XL . Sets ) * len ( formatXL . XL . Sets [ 0 ] ) {
2018-02-20 21:42:09 -05:00
return fmt . Errorf ( "%s disk is already being used in another erasure deployment. (Number of disks specified: %d but the number of disks found in the %s disk's format.json: %d)" ,
humanize . Ordinal ( i + 1 ) , len ( formats ) , humanize . Ordinal ( i + 1 ) , len ( formatXL . XL . Sets ) * len ( formatXL . XL . Sets [ 0 ] ) )
2018-02-15 20:45:57 -05:00
}
2020-04-27 17:39:57 -04:00
// Only if custom erasure drive count is set,
// we should fail here other proceed to honor what
// is present on the disk.
if globalCustomErasureDriveCount && len ( formatXL . XL . Sets [ 0 ] ) != drivesPerSet {
2020-03-08 16:30:25 -04:00
return fmt . Errorf ( "%s disk is already formatted with %d drives per erasure set. This cannot be changed to %d, please revert your MINIO_ERASURE_SET_DRIVE_COUNT setting" , humanize . Ordinal ( i + 1 ) , len ( formatXL . XL . Sets [ 0 ] ) , drivesPerSet )
}
2017-08-03 07:37:02 -04:00
}
2018-02-15 20:45:57 -05:00
return nil
}
2017-08-03 07:37:02 -04:00
2018-07-18 23:17:35 -04:00
// Get Deployment ID for the XL sets from format.json.
// This need not be in quorum. Even if one of the format.json
// file has this value, we assume it is valid.
// If more than one format.json's have different id, it is considered a corrupt
// backend format.
func formatXLGetDeploymentID ( refFormat * formatXLV3 , formats [ ] * formatXLV3 ) ( string , error ) {
var deploymentID string
for _ , format := range formats {
if format == nil || format . ID == "" {
continue
}
if reflect . DeepEqual ( format . XL . Sets , refFormat . XL . Sets ) {
// Found an ID in one of the format.json file
// Set deploymentID for the first time.
if deploymentID == "" {
deploymentID = format . ID
} else if deploymentID != format . ID {
// DeploymentID found earlier doesn't match with the
// current format.json's ID.
return "" , errCorruptedFormat
}
}
}
return deploymentID , nil
}
// formatXLFixDeploymentID - Add deployment id if it is not present.
2019-11-19 20:42:27 -05:00
func formatXLFixDeploymentID ( endpoints Endpoints , storageDisks [ ] StorageAPI , refFormat * formatXLV3 ) ( err error ) {
2018-07-18 23:17:35 -04:00
// Attempt to load all `format.json` from all disks.
var sErrs [ ] error
2020-03-27 17:48:30 -04:00
formats , sErrs := loadFormatXLAll ( storageDisks , false )
2018-07-18 23:17:35 -04:00
for i , sErr := range sErrs {
if _ , ok := formatCriticalErrors [ sErr ] ; ok {
2020-05-26 12:32:33 -04:00
return config . ErrCorruptedBackend ( err ) . Hint ( fmt . Sprintf ( "Clear any pre-existing content on %s" , endpoints [ i ] ) )
2018-07-18 23:17:35 -04:00
}
}
for index := range formats {
// If the XL sets do not match, set those formats to nil,
// We do not have to update the ID on those format.json file.
if formats [ index ] != nil && ! reflect . DeepEqual ( formats [ index ] . XL . Sets , refFormat . XL . Sets ) {
formats [ index ] = nil
}
}
refFormat . ID , err = formatXLGetDeploymentID ( refFormat , formats )
if err != nil {
return err
}
// If ID is set, then some other node got the lock
// before this node could and generated an ID
// for the deployment. No need to generate one.
if refFormat . ID != "" {
return nil
}
// ID is generated for the first time,
// We set the ID in all the formats and update.
refFormat . ID = mustGetUUID ( )
for _ , format := range formats {
if format != nil {
format . ID = refFormat . ID
}
}
// Deployment ID needs to be set on all the disks.
// Save `format.json` across all disks.
2020-04-09 12:30:02 -04:00
return saveFormatXLAll ( GlobalContext , storageDisks , formats )
2018-07-18 23:17:35 -04:00
}
// Update only the valid local disks which have not been updated before.
2019-11-19 20:42:27 -05:00
func formatXLFixLocalDeploymentID ( endpoints Endpoints , storageDisks [ ] StorageAPI , refFormat * formatXLV3 ) error {
2018-07-18 23:17:35 -04:00
// If this server was down when the deploymentID was updated
// then we make sure that we update the local disks with the deploymentID.
2020-03-27 17:48:30 -04:00
// Initialize errs to collect errors inside go-routine.
g := errgroup . WithNErrs ( len ( storageDisks ) )
for index := range storageDisks {
index := index
g . Go ( func ( ) error {
if endpoints [ index ] . IsLocal && storageDisks [ index ] != nil && storageDisks [ index ] . IsOnline ( ) {
format , err := loadFormatXL ( storageDisks [ index ] )
if err != nil {
// Disk can be offline etc.
// ignore the errors seen here.
return nil
}
if format . ID != "" {
return nil
}
if ! reflect . DeepEqual ( format . XL . Sets , refFormat . XL . Sets ) {
return nil
}
format . ID = refFormat . ID
if err := saveFormatXL ( storageDisks [ index ] , format , format . XL . This ) ; err != nil {
2020-04-09 12:30:02 -04:00
logger . LogIf ( GlobalContext , err )
2020-03-27 17:48:30 -04:00
return fmt . Errorf ( "Unable to save format.json, %w" , err )
}
2018-07-18 23:17:35 -04:00
}
2020-03-27 17:48:30 -04:00
return nil
} , index )
}
for _ , err := range g . Wait ( ) {
if err != nil {
return err
2018-07-18 23:17:35 -04:00
}
}
return nil
}
2018-02-15 20:45:57 -05:00
// Get backend XL format in quorum `format.json`.
2018-03-15 16:55:23 -04:00
func getFormatXLInQuorum ( formats [ ] * formatXLV3 ) ( * formatXLV3 , error ) {
2018-02-15 20:45:57 -05:00
formatHashes := make ( [ ] string , len ( formats ) )
for i , format := range formats {
if format == nil {
2018-01-22 17:54:55 -05:00
continue
}
2018-02-15 20:45:57 -05:00
h := sha256 . New ( )
for _ , set := range format . XL . Sets {
for _ , diskID := range set {
h . Write ( [ ] byte ( diskID ) )
2016-06-22 20:18:31 -04:00
}
2016-06-01 19:15:56 -04:00
}
2018-02-15 20:45:57 -05:00
formatHashes [ i ] = hex . EncodeToString ( h . Sum ( nil ) )
2016-06-01 19:15:56 -04:00
}
2016-07-26 06:18:47 -04:00
2018-02-15 20:45:57 -05:00
formatCountMap := make ( map [ string ] int )
for _ , hash := range formatHashes {
if hash == "" {
continue
}
formatCountMap [ hash ] ++
}
2016-06-01 19:15:56 -04:00
2018-02-15 20:45:57 -05:00
maxHash := ""
maxCount := 0
for hash , count := range formatCountMap {
if count > maxCount {
maxCount = count
maxHash = hash
2016-07-28 19:49:59 -04:00
}
2018-02-15 20:45:57 -05:00
}
if maxCount < len ( formats ) / 2 {
return nil , errXLReadQuorum
}
for i , hash := range formatHashes {
if hash == maxHash {
2019-11-21 07:24:51 -05:00
format := formats [ i ] . Clone ( )
2018-02-15 20:45:57 -05:00
format . XL . This = ""
2019-11-21 07:24:51 -05:00
return format , nil
2016-07-28 19:49:59 -04:00
}
}
2018-02-15 20:45:57 -05:00
return nil , errXLReadQuorum
2016-07-28 19:49:59 -04:00
}
2018-03-15 16:55:23 -04:00
func formatXLV3Check ( reference * formatXLV3 , format * formatXLV3 ) error {
2019-11-21 07:24:51 -05:00
tmpFormat := format . Clone ( )
2018-02-15 20:45:57 -05:00
this := tmpFormat . XL . This
tmpFormat . XL . This = ""
if len ( reference . XL . Sets ) != len ( format . XL . Sets ) {
return fmt . Errorf ( "Expected number of sets %d, got %d" , len ( reference . XL . Sets ) , len ( format . XL . Sets ) )
}
2017-08-03 07:37:02 -04:00
2018-02-15 20:45:57 -05:00
// Make sure that the sets match.
for i := range reference . XL . Sets {
if len ( reference . XL . Sets [ i ] ) != len ( format . XL . Sets [ i ] ) {
return fmt . Errorf ( "Each set should be of same size, expected %d got %d" ,
len ( reference . XL . Sets [ i ] ) , len ( format . XL . Sets [ i ] ) )
2016-07-28 19:49:59 -04:00
}
2018-02-15 20:45:57 -05:00
for j := range reference . XL . Sets [ i ] {
if reference . XL . Sets [ i ] [ j ] != format . XL . Sets [ i ] [ j ] {
return fmt . Errorf ( "UUID on positions %d:%d do not match with, expected %s got %s" ,
i , j , reference . XL . Sets [ i ] [ j ] , format . XL . Sets [ i ] [ j ] )
2016-07-28 19:49:59 -04:00
}
}
2018-02-15 20:45:57 -05:00
}
// Make sure that the diskID is found in the set.
for i := 0 ; i < len ( tmpFormat . XL . Sets ) ; i ++ {
for j := 0 ; j < len ( tmpFormat . XL . Sets [ i ] ) ; j ++ {
if this == tmpFormat . XL . Sets [ i ] [ j ] {
return nil
2016-07-28 19:49:59 -04:00
}
}
}
2018-02-15 20:45:57 -05:00
return fmt . Errorf ( "Disk ID %s not found in any disk sets %s" , this , format . XL . Sets )
2016-07-28 19:49:59 -04:00
}
2020-01-15 15:36:52 -05:00
// Initializes meta volume only on local storage disks.
func initXLMetaVolumesInLocalDisks ( storageDisks [ ] StorageAPI , formats [ ] * formatXLV3 ) error {
// Compute the local disks eligible for meta volumes (re)initialization
var disksToInit [ ] StorageAPI
for index := range storageDisks {
2020-05-19 17:27:20 -04:00
if formats [ index ] == nil || storageDisks [ index ] == nil || ! storageDisks [ index ] . IsLocal ( ) {
2020-01-15 15:36:52 -05:00
// Ignore create meta volume on disks which are not found or not local.
continue
}
disksToInit = append ( disksToInit , storageDisks [ index ] )
}
2019-12-23 19:31:03 -05:00
// Initialize errs to collect errors inside go-routine.
2020-01-15 15:36:52 -05:00
g := errgroup . WithNErrs ( len ( disksToInit ) )
2019-12-23 19:31:03 -05:00
// Initialize all disks in parallel.
2020-01-15 15:36:52 -05:00
for index := range disksToInit {
// Initialize a new index variable in each loop so each
// goroutine will return its own instance of index variable.
2019-12-23 19:31:03 -05:00
index := index
g . Go ( func ( ) error {
2020-02-06 16:12:36 -05:00
return makeFormatXLMetaVolumes ( disksToInit [ index ] )
2019-12-23 19:31:03 -05:00
} , index )
}
// Return upon first error.
for _ , err := range g . Wait ( ) {
if err == nil {
continue
}
return toObjectErr ( err , minioMetaBucket )
}
// Return success here.
return nil
}
2018-02-15 20:45:57 -05:00
// saveFormatXLAll - populates `format.json` on disks in its order.
2018-04-05 18:04:40 -04:00
func saveFormatXLAll ( ctx context . Context , storageDisks [ ] StorageAPI , formats [ ] * formatXLV3 ) error {
2019-10-14 12:44:51 -04:00
g := errgroup . WithNErrs ( len ( storageDisks ) )
2016-07-28 19:49:59 -04:00
2018-02-15 20:45:57 -05:00
// Write `format.json` to all disks.
2019-10-14 12:44:51 -04:00
for index := range storageDisks {
index := index
g . Go ( func ( ) error {
2020-03-27 17:48:30 -04:00
return saveFormatXL ( storageDisks [ index ] , formats [ index ] , formats [ index ] . XL . This )
2019-10-14 12:44:51 -04:00
} , index )
2016-07-28 19:49:59 -04:00
}
2020-03-31 12:32:16 -04:00
writeQuorum := getWriteQuorum ( len ( storageDisks ) )
2019-10-14 12:44:51 -04:00
// Wait for the routines to finish.
return reduceWriteQuorumErrs ( ctx , g . Wait ( ) , nil , writeQuorum )
2018-02-15 20:45:57 -05:00
}
2018-04-04 00:58:48 -04:00
// relinquishes the underlying connection for all storage disks.
func closeStorageDisks ( storageDisks [ ] StorageAPI ) {
for _ , disk := range storageDisks {
if disk == nil {
continue
}
disk . Close ( )
}
}
2019-09-27 19:47:12 -04:00
// Initialize storage disks for each endpoint.
// Errors are returned for each endpoint with matching index.
2019-11-19 20:42:27 -05:00
func initStorageDisksWithErrors ( endpoints Endpoints ) ( [ ] StorageAPI , [ ] error ) {
2018-02-15 20:45:57 -05:00
// Bootstrap disks.
storageDisks := make ( [ ] StorageAPI , len ( endpoints ) )
2019-10-14 12:44:51 -04:00
g := errgroup . WithNErrs ( len ( endpoints ) )
for index := range endpoints {
index := index
g . Go ( func ( ) error {
storageDisk , err := newStorageAPI ( endpoints [ index ] )
if err != nil {
return err
}
storageDisks [ index ] = storageDisk
return nil
} , index )
2019-08-02 15:17:26 -04:00
}
2019-10-14 12:44:51 -04:00
return storageDisks , g . Wait ( )
2019-08-02 15:17:26 -04:00
}
2018-03-19 12:13:00 -04:00
// formatXLV3ThisEmpty - find out if '.This' field is empty
// in any of the input `formats`, if yes return true.
func formatXLV3ThisEmpty ( formats [ ] * formatXLV3 ) bool {
for _ , format := range formats {
if format == nil {
continue
}
// NOTE: This code is specifically needed when migrating version
// V1 to V2 to V3, in a scenario such as this we only need to handle
// single sets since we never used to support multiple sets in releases
// with V1 format version.
if len ( format . XL . Sets ) > 1 {
continue
}
if format . XL . This == "" {
return true
}
}
return false
}
// fixFormatXLV3 - fix format XL configuration on all disks.
2019-11-19 20:42:27 -05:00
func fixFormatXLV3 ( storageDisks [ ] StorageAPI , endpoints Endpoints , formats [ ] * formatXLV3 ) error {
2020-03-27 17:48:30 -04:00
g := errgroup . WithNErrs ( len ( formats ) )
for i := range formats {
i := i
g . Go ( func ( ) error {
if formats [ i ] == nil || ! endpoints [ i ] . IsLocal {
return nil
}
// NOTE: This code is specifically needed when migrating version
// V1 to V2 to V3, in a scenario such as this we only need to handle
// single sets since we never used to support multiple sets in releases
// with V1 format version.
if len ( formats [ i ] . XL . Sets ) > 1 {
return nil
}
if formats [ i ] . XL . This == "" {
formats [ i ] . XL . This = formats [ i ] . XL . Sets [ 0 ] [ i ]
if err := saveFormatXL ( storageDisks [ i ] , formats [ i ] , formats [ i ] . XL . This ) ; err != nil {
return err
}
2018-03-19 12:13:00 -04:00
}
2020-03-27 17:48:30 -04:00
return nil
} , i )
}
for _ , err := range g . Wait ( ) {
if err != nil {
return err
2018-03-19 12:13:00 -04:00
}
}
return nil
2020-03-27 17:48:30 -04:00
2018-03-19 12:13:00 -04:00
}
2018-02-15 20:45:57 -05:00
// initFormatXL - save XL format configuration on all disks.
2019-11-21 07:24:51 -05:00
func initFormatXL ( ctx context . Context , storageDisks [ ] StorageAPI , setCount , drivesPerSet int , deploymentID string ) ( * formatXLV3 , error ) {
format := newFormatXLV3 ( setCount , drivesPerSet )
2018-04-04 00:58:48 -04:00
formats := make ( [ ] * formatXLV3 , len ( storageDisks ) )
2020-01-13 16:09:10 -05:00
wantAtMost := ecDrivesNoConfig ( drivesPerSet )
2016-05-04 15:18:20 -04:00
2018-02-15 20:45:57 -05:00
for i := 0 ; i < setCount ; i ++ {
2020-01-13 16:09:10 -05:00
hostCount := make ( map [ string ] int , drivesPerSet )
2019-11-21 07:24:51 -05:00
for j := 0 ; j < drivesPerSet ; j ++ {
2020-01-13 16:09:10 -05:00
disk := storageDisks [ i * drivesPerSet + j ]
2019-11-21 07:24:51 -05:00
newFormat := format . Clone ( )
2018-02-15 20:45:57 -05:00
newFormat . XL . This = format . XL . Sets [ i ] [ j ]
2019-11-20 05:09:30 -05:00
if deploymentID != "" {
newFormat . ID = deploymentID
}
2020-01-13 16:09:10 -05:00
hostCount [ disk . Hostname ( ) ] ++
2019-11-21 07:24:51 -05:00
formats [ i * drivesPerSet + j ] = newFormat
2018-02-15 20:45:57 -05:00
}
2020-01-13 16:09:10 -05:00
if len ( hostCount ) > 0 {
var once sync . Once
for host , count := range hostCount {
if count > wantAtMost {
if host == "" {
host = "local"
}
once . Do ( func ( ) {
if len ( hostCount ) == 1 {
return
}
logger . Info ( " * Set %v:" , i + 1 )
for j := 0 ; j < drivesPerSet ; j ++ {
disk := storageDisks [ i * drivesPerSet + j ]
logger . Info ( " - Drive: %s" , disk . String ( ) )
}
} )
logger . Info ( color . Yellow ( "WARNING:" ) + " Host %v has more than %v drives of set. " +
"A host failure will result in data becoming unavailable." , host , wantAtMost )
}
}
}
2016-05-04 15:18:20 -04:00
}
2018-02-15 20:45:57 -05:00
// Save formats `format.json` across all disks.
2019-11-21 07:24:51 -05:00
if err := saveFormatXLAll ( ctx , storageDisks , formats ) ; err != nil {
2018-02-15 20:45:57 -05:00
return nil , err
2017-04-18 13:35:17 -04:00
}
2018-02-15 20:45:57 -05:00
2019-11-21 07:24:51 -05:00
return getFormatXLInQuorum ( formats )
2017-04-18 13:35:17 -04:00
}
2020-01-13 16:09:10 -05:00
// ecDrivesNoConfig returns the erasure coded drives in a set if no config has been set.
// It will attempt to read it from env variable and fall back to drives/2.
func ecDrivesNoConfig ( drivesPerSet int ) int {
ecDrives := globalStorageClass . GetParityForSC ( storageclass . STANDARD )
if ecDrives == 0 {
cfg , err := storageclass . LookupConfig ( nil , drivesPerSet )
if err == nil {
ecDrives = cfg . Standard . Parity
}
if ecDrives == 0 {
ecDrives = drivesPerSet / 2
}
}
return ecDrives
}
2018-02-15 20:45:57 -05:00
// Make XL backend meta volumes.
func makeFormatXLMetaVolumes ( disk StorageAPI ) error {
2020-03-27 17:48:30 -04:00
if disk == nil {
return errDiskNotFound
}
2019-12-23 19:31:03 -05:00
// Attempt to create MinIO internal buckets.
2020-03-18 19:19:29 -04:00
return disk . MakeVolBulk ( minioMetaBucket , minioMetaTmpBucket , minioMetaMultipartBucket , dataUsageBucket )
2016-12-11 18:18:55 -05:00
}
2018-02-15 20:45:57 -05:00
// Get all UUIDs which are present in reference format should
// be present in the list of formats provided, those are considered
// as online UUIDs.
2018-03-15 16:55:23 -04:00
func getOnlineUUIDs ( refFormat * formatXLV3 , formats [ ] * formatXLV3 ) ( onlineUUIDs [ ] string ) {
2018-02-15 20:45:57 -05:00
for _ , format := range formats {
if format == nil {
continue
}
for _ , set := range refFormat . XL . Sets {
for _ , uuid := range set {
if format . XL . This == uuid {
onlineUUIDs = append ( onlineUUIDs , uuid )
}
}
}
2016-05-07 03:59:43 -04:00
}
2018-02-15 20:45:57 -05:00
return onlineUUIDs
}
2016-06-22 20:18:31 -04:00
2018-02-15 20:45:57 -05:00
// Look for all UUIDs which are not present in reference format
// but are present in the onlineUUIDs list, construct of list such
// offline UUIDs.
2018-03-15 16:55:23 -04:00
func getOfflineUUIDs ( refFormat * formatXLV3 , formats [ ] * formatXLV3 ) ( offlineUUIDs [ ] string ) {
2018-02-15 20:45:57 -05:00
onlineUUIDs := getOnlineUUIDs ( refFormat , formats )
for i , set := range refFormat . XL . Sets {
for j , uuid := range set {
var found bool
for _ , onlineUUID := range onlineUUIDs {
if refFormat . XL . Sets [ i ] [ j ] == onlineUUID {
found = true
}
}
if ! found {
offlineUUIDs = append ( offlineUUIDs , uuid )
}
}
2016-05-04 15:18:20 -04:00
}
2018-02-15 20:45:57 -05:00
return offlineUUIDs
2018-01-08 17:30:55 -05:00
}
2018-02-15 20:45:57 -05:00
// Mark all UUIDs that are offline.
2018-03-15 16:55:23 -04:00
func markUUIDsOffline ( refFormat * formatXLV3 , formats [ ] * formatXLV3 ) {
2018-02-15 20:45:57 -05:00
offlineUUIDs := getOfflineUUIDs ( refFormat , formats )
for i , set := range refFormat . XL . Sets {
for j := range set {
for _ , offlineUUID := range offlineUUIDs {
if refFormat . XL . Sets [ i ] [ j ] == offlineUUID {
refFormat . XL . Sets [ i ] [ j ] = offlineDiskUUID
}
}
}
2016-08-30 22:22:27 -04:00
}
2018-02-15 20:45:57 -05:00
}
2016-08-30 22:22:27 -04:00
2018-02-15 20:45:57 -05:00
// Initialize a new set of set formats which will be written to all disks.
2019-11-21 07:24:51 -05:00
func newHealFormatSets ( refFormat * formatXLV3 , setCount , drivesPerSet int , formats [ ] * formatXLV3 , errs [ ] error ) [ ] [ ] * formatXLV3 {
2018-03-15 16:55:23 -04:00
newFormats := make ( [ ] [ ] * formatXLV3 , setCount )
2018-02-15 20:45:57 -05:00
for i := range refFormat . XL . Sets {
2019-11-21 07:24:51 -05:00
newFormats [ i ] = make ( [ ] * formatXLV3 , drivesPerSet )
2018-02-15 20:45:57 -05:00
}
for i := range refFormat . XL . Sets {
for j := range refFormat . XL . Sets [ i ] {
2019-11-21 07:24:51 -05:00
if errs [ i * drivesPerSet + j ] == errUnformattedDisk || errs [ i * drivesPerSet + j ] == nil {
2018-03-15 16:55:23 -04:00
newFormats [ i ] [ j ] = & formatXLV3 { }
2018-02-15 20:45:57 -05:00
newFormats [ i ] [ j ] . Version = refFormat . Version
2019-01-22 21:32:06 -05:00
newFormats [ i ] [ j ] . ID = refFormat . ID
2018-02-15 20:45:57 -05:00
newFormats [ i ] [ j ] . Format = refFormat . Format
newFormats [ i ] [ j ] . XL . Version = refFormat . XL . Version
newFormats [ i ] [ j ] . XL . DistributionAlgo = refFormat . XL . DistributionAlgo
}
2019-11-21 07:24:51 -05:00
if errs [ i * drivesPerSet + j ] == errUnformattedDisk {
2018-02-15 20:45:57 -05:00
newFormats [ i ] [ j ] . XL . This = ""
newFormats [ i ] [ j ] . XL . Sets = nil
continue
}
2019-11-21 07:24:51 -05:00
if errs [ i * drivesPerSet + j ] == nil {
newFormats [ i ] [ j ] . XL . This = formats [ i * drivesPerSet + j ] . XL . This
2018-02-15 20:45:57 -05:00
newFormats [ i ] [ j ] . XL . Sets = nil
}
}
}
return newFormats
2016-05-04 15:18:20 -04:00
}