2022-06-07 04:44:52 +05:30
|
|
|
// Copyright (c) 2015-2022 MinIO, Inc.
|
|
|
|
//
|
|
|
|
// This file is part of MinIO Object Storage stack
|
|
|
|
//
|
|
|
|
// This program is free software: you can redistribute it and/or modify
|
|
|
|
// it under the terms of the GNU Affero General Public License as published by
|
|
|
|
// the Free Software Foundation, either version 3 of the License, or
|
|
|
|
// (at your option) any later version.
|
|
|
|
//
|
|
|
|
// This program is distributed in the hope that it will be useful
|
|
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
// GNU Affero General Public License for more details.
|
|
|
|
//
|
|
|
|
// You should have received a copy of the GNU Affero General Public License
|
|
|
|
// along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
|
|
|
|
package cmd
|
|
|
|
|
|
|
|
import (
|
2022-11-16 03:23:05 +05:30
|
|
|
"bytes"
|
|
|
|
"compress/gzip"
|
2022-06-07 04:44:52 +05:30
|
|
|
"context"
|
2022-11-16 03:23:05 +05:30
|
|
|
"encoding/json"
|
|
|
|
"errors"
|
2022-06-07 04:44:52 +05:30
|
|
|
"fmt"
|
|
|
|
"math/rand"
|
2022-11-16 03:23:05 +05:30
|
|
|
"net/url"
|
2022-06-07 04:44:52 +05:30
|
|
|
"time"
|
|
|
|
|
2023-06-19 17:53:08 -07:00
|
|
|
"github.com/minio/madmin-go/v3"
|
2022-06-07 04:44:52 +05:30
|
|
|
)
|
|
|
|
|
2022-10-27 00:20:01 -07:00
|
|
|
// callhomeLeaderLockTimeout is the dynamic timeout passed to GetLock when a
// node tries to acquire the callhome leader lock in runCallhome.
// NOTE(review): the two arguments are presumably the initial timeout (30s)
// and the minimum timeout (10s) - confirm against newDynamicTimeout.
var callhomeLeaderLockTimeout = newDynamicTimeout(30*time.Second, 10*time.Second)
|
2022-06-07 04:44:52 +05:30
|
|
|
|
|
|
|
// initCallhome will start the callhome task in the background.
|
|
|
|
func initCallhome(ctx context.Context, objAPI ObjectLayer) {
|
2022-10-27 00:20:01 -07:00
|
|
|
if !globalCallhomeConfig.Enabled() {
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
2022-06-07 04:44:52 +05:30
|
|
|
go func() {
|
|
|
|
r := rand.New(rand.NewSource(time.Now().UnixNano()))
|
|
|
|
// Leader node (that successfully acquires the lock inside runCallhome)
|
|
|
|
// will keep performing the callhome. If the leader goes down for some reason,
|
|
|
|
// the lock will be released and another node will acquire it and take over
|
|
|
|
// because of this loop.
|
|
|
|
for {
|
2022-10-27 00:20:01 -07:00
|
|
|
if !globalCallhomeConfig.Enabled() {
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
if !runCallhome(ctx, objAPI) {
|
|
|
|
// callhome was disabled or context was canceled
|
2022-06-07 04:44:52 +05:30
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
// callhome running on a different node.
|
|
|
|
// sleep for some time and try again.
|
2022-10-27 00:20:01 -07:00
|
|
|
duration := time.Duration(r.Float64() * float64(globalCallhomeConfig.FrequencyDur()))
|
2022-06-07 04:44:52 +05:30
|
|
|
if duration < time.Second {
|
2024-01-17 23:03:17 -08:00
|
|
|
// Make sure to sleep at least a second to avoid high CPU ticks.
|
2022-06-07 04:44:52 +05:30
|
|
|
duration = time.Second
|
|
|
|
}
|
|
|
|
time.Sleep(duration)
|
|
|
|
}
|
|
|
|
}()
|
|
|
|
}
|
|
|
|
|
2022-10-27 00:20:01 -07:00
|
|
|
func runCallhome(ctx context.Context, objAPI ObjectLayer) bool {
|
2022-06-07 04:44:52 +05:30
|
|
|
// Make sure only 1 callhome is running on the cluster.
|
|
|
|
locker := objAPI.NewNSLock(minioMetaBucket, "callhome/runCallhome.lock")
|
|
|
|
lkctx, err := locker.GetLock(ctx, callhomeLeaderLockTimeout)
|
|
|
|
if err != nil {
|
2022-10-27 00:20:01 -07:00
|
|
|
// lock timedout means some other node is the leader,
|
|
|
|
// cycle back return 'true'
|
|
|
|
return true
|
2022-06-07 04:44:52 +05:30
|
|
|
}
|
|
|
|
|
|
|
|
ctx = lkctx.Context()
|
2022-12-24 04:49:07 +01:00
|
|
|
defer locker.Unlock(lkctx)
|
2022-06-07 04:44:52 +05:30
|
|
|
|
2022-10-27 00:20:01 -07:00
|
|
|
callhomeTimer := time.NewTimer(globalCallhomeConfig.FrequencyDur())
|
2022-06-07 04:44:52 +05:30
|
|
|
defer callhomeTimer.Stop()
|
|
|
|
|
|
|
|
for {
|
2022-10-27 00:20:01 -07:00
|
|
|
if !globalCallhomeConfig.Enabled() {
|
|
|
|
// Stop the processing as callhome got disabled
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
|
2022-06-07 04:44:52 +05:30
|
|
|
select {
|
|
|
|
case <-ctx.Done():
|
2022-10-27 00:20:01 -07:00
|
|
|
// indicates that we do not need to run callhome anymore
|
|
|
|
return false
|
2022-06-07 04:44:52 +05:30
|
|
|
case <-callhomeTimer.C:
|
2022-10-27 00:20:01 -07:00
|
|
|
if !globalCallhomeConfig.Enabled() {
|
2022-06-07 04:44:52 +05:30
|
|
|
// Stop the processing as callhome got disabled
|
2022-10-27 00:20:01 -07:00
|
|
|
return false
|
2022-06-07 04:44:52 +05:30
|
|
|
}
|
2022-10-27 00:20:01 -07:00
|
|
|
|
2022-06-07 04:44:52 +05:30
|
|
|
performCallhome(ctx)
|
|
|
|
|
|
|
|
// Reset the timer for next cycle.
|
2022-10-27 00:20:01 -07:00
|
|
|
callhomeTimer.Reset(globalCallhomeConfig.FrequencyDur())
|
2022-06-07 04:44:52 +05:30
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
func performCallhome(ctx context.Context) {
|
2022-11-16 03:23:05 +05:30
|
|
|
deadline := 10 * time.Second // Default deadline is 10secs for callhome
|
|
|
|
objectAPI := newObjectLayerFn()
|
|
|
|
if objectAPI == nil {
|
2024-04-04 13:04:40 +01:00
|
|
|
internalLogIf(ctx, errors.New("Callhome: object layer not ready"))
|
2022-11-16 03:23:05 +05:30
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
healthCtx, healthCancel := context.WithTimeout(ctx, deadline)
|
|
|
|
defer healthCancel()
|
|
|
|
|
|
|
|
healthInfoCh := make(chan madmin.HealthInfo)
|
|
|
|
|
|
|
|
query := url.Values{}
|
|
|
|
for _, k := range madmin.HealthDataTypesList {
|
|
|
|
query.Set(string(k), "true")
|
|
|
|
}
|
|
|
|
|
|
|
|
healthInfo := madmin.HealthInfo{
|
2022-11-23 20:41:22 +05:30
|
|
|
TimeStamp: time.Now().UTC(),
|
|
|
|
Version: madmin.HealthInfoVersion,
|
2022-11-16 03:23:05 +05:30
|
|
|
Minio: madmin.MinioHealthInfo{
|
|
|
|
Info: madmin.MinioInfo{
|
2023-10-18 08:06:57 -07:00
|
|
|
DeploymentID: globalDeploymentID(),
|
2022-11-16 03:23:05 +05:30
|
|
|
},
|
|
|
|
},
|
|
|
|
}
|
|
|
|
|
|
|
|
go fetchHealthInfo(healthCtx, objectAPI, &query, healthInfoCh, healthInfo)
|
|
|
|
|
|
|
|
for {
|
|
|
|
select {
|
|
|
|
case hi, hasMore := <-healthInfoCh:
|
|
|
|
if !hasMore {
|
|
|
|
// Received all data. Send to SUBNET and return
|
|
|
|
err := sendHealthInfo(ctx, healthInfo)
|
|
|
|
if err != nil {
|
2024-04-04 13:04:40 +01:00
|
|
|
internalLogIf(ctx, fmt.Errorf("Unable to perform callhome: %w", err))
|
2022-11-16 03:23:05 +05:30
|
|
|
}
|
|
|
|
return
|
|
|
|
}
|
|
|
|
healthInfo = hi
|
|
|
|
case <-healthCtx.Done():
|
|
|
|
return
|
|
|
|
}
|
2022-06-07 04:44:52 +05:30
|
|
|
}
|
|
|
|
}
|
2022-06-27 03:58:25 -07:00
|
|
|
|
|
|
|
const (
|
2023-11-24 23:29:35 +05:30
|
|
|
// subnetHealthPath is the path appended to globalSubnetConfig.BaseURL to
// build the health info upload URL in sendHealthInfo.
subnetHealthPath = "/api/health/upload"
|
2022-06-27 03:58:25 -07:00
|
|
|
)
|
|
|
|
|
2022-11-16 03:23:05 +05:30
|
|
|
func sendHealthInfo(ctx context.Context, healthInfo madmin.HealthInfo) error {
|
2023-11-24 23:29:35 +05:30
|
|
|
url := globalSubnetConfig.BaseURL + subnetHealthPath
|
2022-11-16 03:23:05 +05:30
|
|
|
|
|
|
|
filename := fmt.Sprintf("health_%s.json.gz", UTCNow().Format("20060102150405"))
|
2023-03-23 12:54:58 +05:30
|
|
|
url += "?filename=" + filename
|
2022-11-16 03:23:05 +05:30
|
|
|
|
|
|
|
_, err := globalSubnetConfig.Upload(url, filename, createHealthJSONGzip(ctx, healthInfo))
|
2022-06-27 03:58:25 -07:00
|
|
|
return err
|
|
|
|
}
|
2022-11-16 03:23:05 +05:30
|
|
|
|
|
|
|
func createHealthJSONGzip(ctx context.Context, healthInfo madmin.HealthInfo) []byte {
|
|
|
|
var b bytes.Buffer
|
|
|
|
gzWriter := gzip.NewWriter(&b)
|
|
|
|
|
|
|
|
header := struct {
|
|
|
|
Version string `json:"version"`
|
|
|
|
}{Version: healthInfo.Version}
|
|
|
|
|
|
|
|
enc := json.NewEncoder(gzWriter)
|
|
|
|
if e := enc.Encode(header); e != nil {
|
2024-04-04 13:04:40 +01:00
|
|
|
internalLogIf(ctx, fmt.Errorf("Could not encode health info header: %w", e))
|
2022-11-16 03:23:05 +05:30
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
if e := enc.Encode(healthInfo); e != nil {
|
2024-04-04 13:04:40 +01:00
|
|
|
internalLogIf(ctx, fmt.Errorf("Could not encode health info: %w", e))
|
2022-11-16 03:23:05 +05:30
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
gzWriter.Flush()
|
|
|
|
gzWriter.Close()
|
|
|
|
|
|
|
|
return b.Bytes()
|
|
|
|
}
|