2016-08-30 19:22:27 -07:00
|
|
|
/*
|
2019-04-09 11:39:42 -07:00
|
|
|
* MinIO Cloud Storage, (C) 2016 MinIO, Inc.
|
2016-08-30 19:22:27 -07:00
|
|
|
*
|
|
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
|
|
* you may not use this file except in compliance with the License.
|
|
|
|
* You may obtain a copy of the License at
|
|
|
|
*
|
|
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
*
|
|
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
* See the License for the specific language governing permissions and
|
|
|
|
* limitations under the License.
|
|
|
|
*/
|
|
|
|
|
|
|
|
package cmd
|
|
|
|
|
|
|
|
import (
|
2020-08-04 14:55:53 -07:00
|
|
|
"context"
|
2020-01-14 18:45:17 -08:00
|
|
|
"crypto/tls"
|
2017-06-17 11:20:12 -07:00
|
|
|
"fmt"
|
2020-01-14 18:45:17 -08:00
|
|
|
"net/http"
|
|
|
|
"net/url"
|
2018-02-15 17:45:57 -08:00
|
|
|
"os"
|
2020-01-14 18:45:17 -08:00
|
|
|
"path"
|
2019-10-30 00:04:39 -07:00
|
|
|
"sync"
|
2016-08-30 19:22:27 -07:00
|
|
|
"time"
|
|
|
|
|
2020-05-13 20:25:29 -07:00
|
|
|
"github.com/dustin/go-humanize"
|
2020-01-14 18:45:17 -08:00
|
|
|
xhttp "github.com/minio/minio/cmd/http"
|
2018-04-05 15:04:40 -07:00
|
|
|
"github.com/minio/minio/cmd/logger"
|
2019-01-26 01:33:28 +04:00
|
|
|
"github.com/minio/minio/pkg/sync/errgroup"
|
2016-08-30 19:22:27 -07:00
|
|
|
)
|
|
|
|
|
2020-07-17 10:08:04 -07:00
|
|
|
var printEndpointError = func() func(Endpoint, error, bool) {
|
2019-10-30 00:04:39 -07:00
|
|
|
var mutex sync.Mutex
|
2020-07-17 10:08:04 -07:00
|
|
|
printOnce := make(map[Endpoint]map[string]int)
|
2018-02-15 17:45:57 -08:00
|
|
|
|
2020-07-17 10:08:04 -07:00
|
|
|
return func(endpoint Endpoint, err error, once bool) {
|
2018-09-13 21:42:50 -07:00
|
|
|
reqInfo := (&logger.ReqInfo{}).AppendTags("endpoint", endpoint.String())
|
2020-04-09 09:30:02 -07:00
|
|
|
ctx := logger.SetReqInfo(GlobalContext, reqInfo)
|
2019-10-30 00:04:39 -07:00
|
|
|
mutex.Lock()
|
|
|
|
defer mutex.Unlock()
|
2020-07-17 10:08:04 -07:00
|
|
|
|
2018-02-15 17:45:57 -08:00
|
|
|
m, ok := printOnce[endpoint]
|
|
|
|
if !ok {
|
2020-07-17 10:08:04 -07:00
|
|
|
m = make(map[string]int)
|
|
|
|
m[err.Error()]++
|
2018-02-15 17:45:57 -08:00
|
|
|
printOnce[endpoint] = m
|
2020-07-17 10:08:04 -07:00
|
|
|
if once {
|
|
|
|
logger.LogAlwaysIf(ctx, err)
|
|
|
|
return
|
|
|
|
}
|
2017-12-28 18:32:48 +01:00
|
|
|
}
|
2020-07-17 10:08:04 -07:00
|
|
|
// Once is set and we are here means error was already
|
|
|
|
// printed once.
|
|
|
|
if once {
|
2018-02-15 17:45:57 -08:00
|
|
|
return
|
2017-12-28 18:32:48 +01:00
|
|
|
}
|
2020-07-17 10:08:04 -07:00
|
|
|
// once not set, check if same error occurred 3 times in
|
|
|
|
// a row, then make sure we print it to call attention.
|
|
|
|
if m[err.Error()] > 2 {
|
|
|
|
logger.LogAlwaysIf(ctx, fmt.Errorf("Following error has been printed %d times.. %w", m[err.Error()], err))
|
|
|
|
// Reduce the count to introduce further delay in printing
|
|
|
|
// but let it again print after the 2th attempt
|
|
|
|
m[err.Error()]--
|
|
|
|
m[err.Error()]--
|
|
|
|
}
|
|
|
|
m[err.Error()]++
|
2017-12-28 18:32:48 +01:00
|
|
|
}
|
2018-02-15 17:45:57 -08:00
|
|
|
}()
|
2016-08-30 19:22:27 -07:00
|
|
|
|
2018-03-15 13:55:23 -07:00
|
|
|
// Migrates backend format of local disks.
|
2020-06-12 20:04:01 -07:00
|
|
|
func formatErasureMigrateLocalEndpoints(endpoints Endpoints) error {
|
2019-01-26 01:33:28 +04:00
|
|
|
g := errgroup.WithNErrs(len(endpoints))
|
|
|
|
for index, endpoint := range endpoints {
|
2018-02-15 17:45:57 -08:00
|
|
|
if !endpoint.IsLocal {
|
|
|
|
continue
|
2016-08-30 19:22:27 -07:00
|
|
|
}
|
2019-01-26 01:33:28 +04:00
|
|
|
index := index
|
|
|
|
g.Go(func() error {
|
|
|
|
epPath := endpoints[index].Path
|
|
|
|
formatPath := pathJoin(epPath, minioMetaBucket, formatConfigFile)
|
|
|
|
if _, err := os.Stat(formatPath); err != nil {
|
|
|
|
if os.IsNotExist(err) {
|
|
|
|
return nil
|
|
|
|
}
|
2019-12-02 09:28:01 -08:00
|
|
|
return fmt.Errorf("unable to access (%s) %w", formatPath, err)
|
2018-02-15 17:45:57 -08:00
|
|
|
}
|
2020-06-12 20:04:01 -07:00
|
|
|
return formatErasureMigrate(epPath)
|
2019-01-26 01:33:28 +04:00
|
|
|
}, index)
|
|
|
|
}
|
|
|
|
for _, err := range g.Wait() {
|
|
|
|
if err != nil {
|
2018-02-15 17:45:57 -08:00
|
|
|
return err
|
2016-11-23 15:48:10 -08:00
|
|
|
}
|
|
|
|
}
|
2018-02-15 17:45:57 -08:00
|
|
|
return nil
|
2016-11-23 15:48:10 -08:00
|
|
|
}
|
|
|
|
|
2018-03-15 13:55:23 -07:00
|
|
|
// Cleans up tmp directory of local disks.
|
2020-06-12 20:04:01 -07:00
|
|
|
func formatErasureCleanupTmpLocalEndpoints(endpoints Endpoints) error {
|
2019-01-26 01:33:28 +04:00
|
|
|
g := errgroup.WithNErrs(len(endpoints))
|
|
|
|
for index, endpoint := range endpoints {
|
2018-03-15 13:55:23 -07:00
|
|
|
if !endpoint.IsLocal {
|
|
|
|
continue
|
|
|
|
}
|
2019-01-26 01:33:28 +04:00
|
|
|
index := index
|
|
|
|
g.Go(func() error {
|
|
|
|
epPath := endpoints[index].Path
|
|
|
|
// If disk is not formatted there is nothing to be cleaned up.
|
|
|
|
formatPath := pathJoin(epPath, minioMetaBucket, formatConfigFile)
|
|
|
|
if _, err := os.Stat(formatPath); err != nil {
|
|
|
|
if os.IsNotExist(err) {
|
|
|
|
return nil
|
|
|
|
}
|
2019-12-02 09:28:01 -08:00
|
|
|
return fmt.Errorf("unable to access (%s) %w", formatPath, err)
|
2018-03-15 13:55:23 -07:00
|
|
|
}
|
2019-01-26 01:33:28 +04:00
|
|
|
if _, err := os.Stat(pathJoin(epPath, minioMetaTmpBucket+"-old")); err != nil {
|
|
|
|
if !os.IsNotExist(err) {
|
2019-12-02 09:28:01 -08:00
|
|
|
return fmt.Errorf("unable to access (%s) %w",
|
2019-08-05 11:41:29 -07:00
|
|
|
pathJoin(epPath, minioMetaTmpBucket+"-old"),
|
|
|
|
err)
|
2019-01-26 01:33:28 +04:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Need to move temporary objects left behind from previous run of minio
|
|
|
|
// server to a unique directory under `minioMetaTmpBucket-old` to clean
|
|
|
|
// up `minioMetaTmpBucket` for the current run.
|
|
|
|
//
|
|
|
|
// /disk1/.minio.sys/tmp-old/
|
|
|
|
// |__ 33a58b40-aecc-4c9f-a22f-ff17bfa33b62
|
|
|
|
// |__ e870a2c1-d09c-450c-a69c-6eaa54a89b3e
|
|
|
|
//
|
|
|
|
// In this example, `33a58b40-aecc-4c9f-a22f-ff17bfa33b62` directory contains
|
|
|
|
// temporary objects from one of the previous runs of minio server.
|
2019-08-05 11:41:29 -07:00
|
|
|
tmpOld := pathJoin(epPath, minioMetaTmpBucket+"-old", mustGetUUID())
|
2019-01-26 01:33:28 +04:00
|
|
|
if err := renameAll(pathJoin(epPath, minioMetaTmpBucket),
|
2019-08-05 11:41:29 -07:00
|
|
|
tmpOld); err != nil && err != errFileNotFound {
|
2019-12-02 09:28:01 -08:00
|
|
|
return fmt.Errorf("unable to rename (%s -> %s) %w",
|
2019-08-05 11:41:29 -07:00
|
|
|
pathJoin(epPath, minioMetaTmpBucket),
|
|
|
|
tmpOld,
|
|
|
|
err)
|
2019-01-26 01:33:28 +04:00
|
|
|
}
|
|
|
|
|
|
|
|
// Removal of tmp-old folder is backgrounded completely.
|
|
|
|
go removeAll(pathJoin(epPath, minioMetaTmpBucket+"-old"))
|
|
|
|
|
2019-08-05 11:41:29 -07:00
|
|
|
if err := mkdirAll(pathJoin(epPath, minioMetaTmpBucket), 0777); err != nil {
|
2019-12-02 09:28:01 -08:00
|
|
|
return fmt.Errorf("unable to create (%s) %w",
|
2019-08-05 11:41:29 -07:00
|
|
|
pathJoin(epPath, minioMetaTmpBucket),
|
|
|
|
err)
|
|
|
|
}
|
|
|
|
return nil
|
2019-01-26 01:33:28 +04:00
|
|
|
}, index)
|
|
|
|
}
|
|
|
|
for _, err := range g.Wait() {
|
|
|
|
if err != nil {
|
2018-03-15 13:55:23 -07:00
|
|
|
return err
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2018-04-03 23:58:48 -05:00
|
|
|
// Following error message is added to fix a regression in release
|
|
|
|
// RELEASE.2018-03-16T22-52-12Z after migrating v1 to v2 to v3. This
|
|
|
|
// migration failed to capture '.This' field properly which indicates
|
|
|
|
// the disk UUID association. Below error message is returned when
|
|
|
|
// we see this situation in format.json, for more info refer
|
|
|
|
// https://github.com/minio/minio/issues/5667
|
2020-06-12 20:04:01 -07:00
|
|
|
var errErasureV3ThisEmpty = fmt.Errorf("Erasure format version 3 has This field empty")
|
2018-04-03 23:58:48 -05:00
|
|
|
|
2020-01-14 18:45:17 -08:00
|
|
|
// IsServerResolvable - checks if the endpoint is resolvable
|
|
|
|
// by sending a naked HTTP request with liveness checks.
|
|
|
|
func IsServerResolvable(endpoint Endpoint) error {
|
|
|
|
serverURL := &url.URL{
|
|
|
|
Scheme: endpoint.Scheme,
|
|
|
|
Host: endpoint.Host,
|
|
|
|
Path: path.Join(healthCheckPathPrefix, healthCheckLivenessPath),
|
|
|
|
}
|
|
|
|
|
|
|
|
var tlsConfig *tls.Config
|
|
|
|
if globalIsSSL {
|
|
|
|
tlsConfig = &tls.Config{
|
|
|
|
ServerName: endpoint.Hostname(),
|
|
|
|
RootCAs: globalRootCAs,
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
req, err := http.NewRequest(http.MethodGet, serverURL.String(), nil)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
httpClient := &http.Client{
|
2020-07-13 09:51:07 -07:00
|
|
|
Transport:
|
|
|
|
// For more details about various values used here refer
|
|
|
|
// https://golang.org/pkg/net/http/#Transport documentation
|
|
|
|
&http.Transport{
|
|
|
|
Proxy: http.ProxyFromEnvironment,
|
|
|
|
DialContext: xhttp.NewCustomDialContext(3 * time.Second),
|
|
|
|
ResponseHeaderTimeout: 5 * time.Second,
|
|
|
|
TLSHandshakeTimeout: 5 * time.Second,
|
|
|
|
ExpectContinueTimeout: 5 * time.Second,
|
|
|
|
TLSClientConfig: tlsConfig,
|
|
|
|
// Go net/http automatically unzip if content-type is
|
|
|
|
// gzip disable this feature, as we are always interested
|
|
|
|
// in raw stream.
|
|
|
|
DisableCompression: true,
|
|
|
|
},
|
2020-01-14 18:45:17 -08:00
|
|
|
}
|
2020-04-17 20:20:56 +02:00
|
|
|
defer httpClient.CloseIdleConnections()
|
2020-01-14 18:45:17 -08:00
|
|
|
|
2020-08-04 14:55:53 -07:00
|
|
|
ctx, cancel := context.WithTimeout(GlobalContext, 5*time.Second)
|
|
|
|
defer cancel()
|
|
|
|
|
|
|
|
resp, err := httpClient.Do(req.WithContext(ctx))
|
2020-01-14 18:45:17 -08:00
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
defer xhttp.DrainBody(resp.Body)
|
|
|
|
|
|
|
|
if resp.StatusCode != http.StatusOK {
|
|
|
|
return StorageErr(resp.Status)
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2020-06-12 20:04:01 -07:00
|
|
|
// connect to list of endpoints and load all Erasure disk formats, validate the formats are correct
|
2018-04-03 23:58:48 -05:00
|
|
|
// and are in quorum, if no formats are found attempt to initialize all of them for the first
|
|
|
|
// time. additionally make sure to close all the disks used in this attempt.
|
2020-06-12 20:04:01 -07:00
|
|
|
func connectLoadInitFormats(retryCount int, firstDisk bool, endpoints Endpoints, zoneCount, setCount, drivesPerSet int, deploymentID string) (storageDisks []StorageAPI, format *formatErasureV3, err error) {
|
2018-09-11 00:21:59 +01:00
|
|
|
// Initialize all storage disks
|
2019-09-27 16:47:12 -07:00
|
|
|
storageDisks, errs := initStorageDisksWithErrors(endpoints)
|
2020-01-14 18:45:17 -08:00
|
|
|
|
2020-04-03 18:06:31 -07:00
|
|
|
defer func(storageDisks []StorageAPI) {
|
|
|
|
if err != nil {
|
|
|
|
closeStorageDisks(storageDisks)
|
|
|
|
}
|
|
|
|
}(storageDisks)
|
|
|
|
|
2019-09-27 16:47:12 -07:00
|
|
|
for i, err := range errs {
|
2020-01-14 18:45:17 -08:00
|
|
|
if err != nil {
|
|
|
|
if err != errDiskNotFound {
|
2020-03-27 14:48:30 -07:00
|
|
|
return nil, nil, fmt.Errorf("Disk %s: %w", endpoints[i], err)
|
2020-01-14 18:45:17 -08:00
|
|
|
}
|
|
|
|
if retryCount >= 5 {
|
|
|
|
logger.Info("Unable to connect to %s: %v\n", endpoints[i], IsServerResolvable(endpoints[i]))
|
|
|
|
}
|
2019-09-27 16:47:12 -07:00
|
|
|
}
|
|
|
|
}
|
2018-04-03 23:58:48 -05:00
|
|
|
|
2018-12-04 10:25:56 -08:00
|
|
|
// Attempt to load all `format.json` from all disks.
|
2020-06-12 20:04:01 -07:00
|
|
|
formatConfigs, sErrs := loadFormatErasureAll(storageDisks, false)
|
2018-12-04 10:25:56 -08:00
|
|
|
// Check if we have
|
|
|
|
for i, sErr := range sErrs {
|
2020-08-03 18:17:48 -07:00
|
|
|
// print the error, nonetheless, which is perhaps unhandled
|
2020-03-08 12:12:07 -07:00
|
|
|
if sErr != errUnformattedDisk && sErr != errDiskNotFound && retryCount >= 5 {
|
2020-03-23 07:32:18 -07:00
|
|
|
if sErr != nil {
|
|
|
|
logger.Info("Unable to read 'format.json' from %s: %v\n", endpoints[i], sErr)
|
|
|
|
}
|
2020-03-08 12:12:07 -07:00
|
|
|
}
|
2018-12-04 10:25:56 -08:00
|
|
|
}
|
|
|
|
|
2018-04-03 23:58:48 -05:00
|
|
|
// Pre-emptively check if one of the formatted disks
|
|
|
|
// is invalid. This function returns success for the
|
|
|
|
// most part unless one of the formats is not consistent
|
2020-06-12 20:04:01 -07:00
|
|
|
// with expected Erasure format. For example if a user is
|
|
|
|
// trying to pool FS backend into an Erasure set.
|
|
|
|
if err = checkFormatErasureValues(formatConfigs, drivesPerSet); err != nil {
|
2020-03-27 14:48:30 -07:00
|
|
|
return nil, nil, err
|
2018-04-03 23:58:48 -05:00
|
|
|
}
|
|
|
|
|
2018-04-12 15:43:38 -07:00
|
|
|
// All disks report unformatted we should initialized everyone.
|
2020-06-12 20:04:01 -07:00
|
|
|
if shouldInitErasureDisks(sErrs) && firstDisk {
|
2020-05-13 20:25:29 -07:00
|
|
|
logger.Info("Formatting %s zone, %v set(s), %v drives per set.",
|
|
|
|
humanize.Ordinal(zoneCount), setCount, drivesPerSet)
|
2020-01-17 15:39:07 -08:00
|
|
|
|
2019-04-02 23:20:13 +05:30
|
|
|
// Initialize erasure code format on disks
|
2020-08-18 14:37:26 -07:00
|
|
|
format, err = initFormatErasure(GlobalContext, storageDisks, setCount, drivesPerSet, deploymentID, sErrs)
|
2019-04-02 23:20:13 +05:30
|
|
|
if err != nil {
|
2020-03-27 14:48:30 -07:00
|
|
|
return nil, nil, err
|
2019-04-02 23:20:13 +05:30
|
|
|
}
|
2020-05-13 20:25:29 -07:00
|
|
|
|
2019-04-02 23:20:13 +05:30
|
|
|
// Assign globalDeploymentID on first run for the
|
|
|
|
// minio server managing the first disk
|
|
|
|
globalDeploymentID = format.ID
|
2020-03-27 14:48:30 -07:00
|
|
|
return storageDisks, format, nil
|
2019-12-23 16:31:03 -08:00
|
|
|
}
|
|
|
|
|
2018-04-12 15:43:38 -07:00
|
|
|
// Return error when quorum unformatted disks - indicating we are
|
|
|
|
// waiting for first server to be online.
|
|
|
|
if quorumUnformattedDisks(sErrs) && !firstDisk {
|
2020-03-27 14:48:30 -07:00
|
|
|
return nil, nil, errNotFirstDisk
|
2018-04-12 15:43:38 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
// Return error when quorum unformatted disks but waiting for rest
|
|
|
|
// of the servers to be online.
|
|
|
|
if quorumUnformattedDisks(sErrs) && firstDisk {
|
2020-03-27 14:48:30 -07:00
|
|
|
return nil, nil, errFirstDiskWait
|
2018-04-12 15:43:38 -07:00
|
|
|
}
|
|
|
|
|
2020-08-18 14:37:26 -07:00
|
|
|
// Mark all root disks down
|
|
|
|
markRootDisksAsDown(storageDisks, sErrs)
|
|
|
|
|
2018-04-03 23:58:48 -05:00
|
|
|
// Following function is added to fix a regressions which was introduced
|
|
|
|
// in release RELEASE.2018-03-16T22-52-12Z after migrating v1 to v2 to v3.
|
|
|
|
// This migration failed to capture '.This' field properly which indicates
|
|
|
|
// the disk UUID association. Below function is called to handle and fix
|
|
|
|
// this regression, for more info refer https://github.com/minio/minio/issues/5667
|
2020-06-12 20:04:01 -07:00
|
|
|
if err = fixFormatErasureV3(storageDisks, endpoints, formatConfigs); err != nil {
|
2020-03-27 14:48:30 -07:00
|
|
|
return nil, nil, err
|
2018-04-03 23:58:48 -05:00
|
|
|
}
|
|
|
|
|
|
|
|
// If any of the .This field is still empty, we return error.
|
2020-06-12 20:04:01 -07:00
|
|
|
if formatErasureV3ThisEmpty(formatConfigs) {
|
|
|
|
return nil, nil, errErasureV3ThisEmpty
|
2018-04-03 23:58:48 -05:00
|
|
|
}
|
|
|
|
|
2020-06-12 20:04:01 -07:00
|
|
|
format, err = getFormatErasureInQuorum(formatConfigs)
|
2018-04-03 23:58:48 -05:00
|
|
|
if err != nil {
|
2020-03-27 14:48:30 -07:00
|
|
|
return nil, nil, err
|
2018-04-03 23:58:48 -05:00
|
|
|
}
|
|
|
|
|
2018-07-18 20:17:35 -07:00
|
|
|
if format.ID == "" {
|
2019-11-13 12:17:45 -08:00
|
|
|
// Not a first disk, wait until first disk fixes deploymentID
|
|
|
|
if !firstDisk {
|
2020-03-27 14:48:30 -07:00
|
|
|
return nil, nil, errNotFirstDisk
|
2019-11-13 12:17:45 -08:00
|
|
|
}
|
2020-06-12 20:04:01 -07:00
|
|
|
if err = formatErasureFixDeploymentID(endpoints, storageDisks, format); err != nil {
|
2020-03-27 14:48:30 -07:00
|
|
|
return nil, nil, err
|
2018-07-18 20:17:35 -07:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2018-11-19 14:47:03 -08:00
|
|
|
globalDeploymentID = format.ID
|
2018-07-18 20:17:35 -07:00
|
|
|
|
2020-06-12 20:04:01 -07:00
|
|
|
if err = formatErasureFixLocalDeploymentID(endpoints, storageDisks, format); err != nil {
|
2020-03-27 14:48:30 -07:00
|
|
|
return nil, nil, err
|
2018-07-18 20:17:35 -07:00
|
|
|
}
|
2019-12-23 16:31:03 -08:00
|
|
|
|
2020-01-15 21:36:52 +01:00
|
|
|
// The will always recreate some directories inside .minio.sys of
|
|
|
|
// the local disk such as tmp, multipart and background-ops
|
2020-06-12 20:04:01 -07:00
|
|
|
initErasureMetaVolumesInLocalDisks(storageDisks, formatConfigs)
|
2020-01-15 21:36:52 +01:00
|
|
|
|
2020-03-27 14:48:30 -07:00
|
|
|
return storageDisks, format, nil
|
2018-04-03 23:58:48 -05:00
|
|
|
}
|
|
|
|
|
2018-02-15 17:45:57 -08:00
|
|
|
// Format disks before initialization of object layer.
|
2020-06-12 20:04:01 -07:00
|
|
|
func waitForFormatErasure(firstDisk bool, endpoints Endpoints, zoneCount, setCount, drivesPerSet int, deploymentID string) ([]StorageAPI, *formatErasureV3, error) {
|
2019-11-21 04:24:51 -08:00
|
|
|
if len(endpoints) == 0 || setCount == 0 || drivesPerSet == 0 {
|
2020-03-27 14:48:30 -07:00
|
|
|
return nil, nil, errInvalidArgument
|
2016-11-02 16:51:06 +01:00
|
|
|
}
|
2018-02-15 17:45:57 -08:00
|
|
|
|
2020-06-12 20:04:01 -07:00
|
|
|
if err := formatErasureMigrateLocalEndpoints(endpoints); err != nil {
|
2020-03-27 14:48:30 -07:00
|
|
|
return nil, nil, err
|
2016-08-30 19:22:27 -07:00
|
|
|
}
|
|
|
|
|
2020-06-12 20:04:01 -07:00
|
|
|
if err := formatErasureCleanupTmpLocalEndpoints(endpoints); err != nil {
|
2020-03-27 14:48:30 -07:00
|
|
|
return nil, nil, err
|
2018-03-15 13:55:23 -07:00
|
|
|
}
|
|
|
|
|
2016-12-07 19:22:00 +01:00
|
|
|
// prepare getElapsedTime() to calculate elapsed time since we started trying formatting disks.
|
|
|
|
// All times are rounded to avoid showing milli, micro and nano seconds
|
|
|
|
formatStartTime := time.Now().Round(time.Second)
|
|
|
|
getElapsedTime := func() string {
|
|
|
|
return time.Now().Round(time.Second).Sub(formatStartTime).String()
|
|
|
|
}
|
|
|
|
|
2020-01-08 22:36:54 +01:00
|
|
|
// Wait on each try for an update.
|
|
|
|
ticker := time.NewTicker(500 * time.Millisecond)
|
|
|
|
defer ticker.Stop()
|
|
|
|
var tries int
|
2016-11-02 23:27:36 +01:00
|
|
|
for {
|
|
|
|
select {
|
2020-01-08 22:36:54 +01:00
|
|
|
case <-ticker.C:
|
2020-03-27 14:48:30 -07:00
|
|
|
storageDisks, format, err := connectLoadInitFormats(tries, firstDisk, endpoints, zoneCount, setCount, drivesPerSet, deploymentID)
|
2018-04-03 23:58:48 -05:00
|
|
|
if err != nil {
|
2020-01-08 22:36:54 +01:00
|
|
|
tries++
|
2018-04-03 23:58:48 -05:00
|
|
|
switch err {
|
|
|
|
case errNotFirstDisk:
|
|
|
|
// Fresh setup, wait for first server to be up.
|
2018-04-10 09:37:14 -07:00
|
|
|
logger.Info("Waiting for the first server to format the disks.")
|
2017-04-18 10:35:17 -07:00
|
|
|
continue
|
2018-04-12 15:43:38 -07:00
|
|
|
case errFirstDiskWait:
|
|
|
|
// Fresh setup, wait for other servers to come up.
|
|
|
|
logger.Info("Waiting for all other servers to be online to format the disks.")
|
|
|
|
continue
|
2020-06-12 20:04:01 -07:00
|
|
|
case errErasureReadQuorum:
|
2018-04-03 23:58:48 -05:00
|
|
|
// no quorum available continue to wait for minimum number of servers.
|
2018-04-10 09:37:14 -07:00
|
|
|
logger.Info("Waiting for a minimum of %d disks to come online (elapsed %s)\n", len(endpoints)/2, getElapsedTime())
|
2018-04-03 23:58:48 -05:00
|
|
|
continue
|
2020-06-12 20:04:01 -07:00
|
|
|
case errErasureV3ThisEmpty:
|
2018-04-03 23:58:48 -05:00
|
|
|
// need to wait for this error to be healed, so continue.
|
|
|
|
continue
|
|
|
|
default:
|
|
|
|
// For all other unhandled errors we exit and fail.
|
2020-03-27 14:48:30 -07:00
|
|
|
return nil, nil, err
|
2017-04-18 10:35:17 -07:00
|
|
|
}
|
2016-12-11 15:18:55 -08:00
|
|
|
}
|
2020-03-27 14:48:30 -07:00
|
|
|
return storageDisks, format, nil
|
2018-02-06 15:07:17 -08:00
|
|
|
case <-globalOSSignalCh:
|
2020-03-27 14:48:30 -07:00
|
|
|
return nil, nil, fmt.Errorf("Initializing data volumes gracefully stopped")
|
2016-11-02 23:27:36 +01:00
|
|
|
}
|
|
|
|
}
|
2016-08-30 19:22:27 -07:00
|
|
|
}
|