2021-04-18 12:41:13 -07:00
|
|
|
// Copyright (c) 2015-2021 MinIO, Inc.
|
|
|
|
//
|
|
|
|
// This file is part of MinIO Object Storage stack
|
|
|
|
//
|
|
|
|
// This program is free software: you can redistribute it and/or modify
|
|
|
|
// it under the terms of the GNU Affero General Public License as published by
|
|
|
|
// the Free Software Foundation, either version 3 of the License, or
|
|
|
|
// (at your option) any later version.
|
|
|
|
//
|
|
|
|
// This program is distributed in the hope that it will be useful
|
|
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
// GNU Affero General Public License for more details.
|
|
|
|
//
|
|
|
|
// You should have received a copy of the GNU Affero General Public License
|
|
|
|
// along with this program. If not, see <http://www.gnu.org/licenses/>.
|
2020-03-26 21:07:39 -07:00
|
|
|
|
|
|
|
package madmin
|
|
|
|
|
|
|
|
import (
|
|
|
|
"context"
|
|
|
|
"encoding/json"
|
|
|
|
"io"
|
|
|
|
"net/http"
|
|
|
|
"net/url"
|
|
|
|
"time"
|
|
|
|
|
|
|
|
"github.com/minio/minio/pkg/disk"
|
|
|
|
"github.com/minio/minio/pkg/net"
|
|
|
|
|
2020-11-21 23:11:33 +05:30
|
|
|
smart "github.com/minio/minio/pkg/smart"
|
2021-03-01 00:15:46 -08:00
|
|
|
"github.com/shirou/gopsutil/v3/cpu"
|
|
|
|
diskhw "github.com/shirou/gopsutil/v3/disk"
|
|
|
|
"github.com/shirou/gopsutil/v3/host"
|
|
|
|
"github.com/shirou/gopsutil/v3/mem"
|
|
|
|
"github.com/shirou/gopsutil/v3/process"
|
2020-03-26 21:07:39 -07:00
|
|
|
)
|
|
|
|
|
2020-11-21 02:22:53 +05:30
|
|
|
// HealthInfo - MinIO cluster's health Info
|
|
|
|
type HealthInfo struct {
|
|
|
|
TimeStamp time.Time `json:"timestamp,omitempty"`
|
|
|
|
Error string `json:"error,omitempty"`
|
|
|
|
Perf PerfInfo `json:"perf,omitempty"`
|
|
|
|
Minio MinioHealthInfo `json:"minio,omitempty"`
|
|
|
|
Sys SysHealthInfo `json:"sys,omitempty"`
|
2020-03-26 21:07:39 -07:00
|
|
|
}
|
|
|
|
|
2020-11-21 02:22:53 +05:30
|
|
|
// SysHealthInfo - Includes hardware and system information of the MinIO cluster
|
|
|
|
type SysHealthInfo struct {
|
|
|
|
CPUInfo []ServerCPUInfo `json:"cpus,omitempty"`
|
|
|
|
DiskHwInfo []ServerDiskHwInfo `json:"drives,omitempty"`
|
|
|
|
OsInfo []ServerOsInfo `json:"osinfos,omitempty"`
|
|
|
|
MemInfo []ServerMemInfo `json:"meminfos,omitempty"`
|
|
|
|
ProcInfo []ServerProcInfo `json:"procinfos,omitempty"`
|
|
|
|
Error string `json:"error,omitempty"`
|
2020-03-26 21:07:39 -07:00
|
|
|
}
|
|
|
|
|
2020-11-21 02:22:53 +05:30
|
|
|
// ServerProcInfo - Includes host process lvl information
|
|
|
|
type ServerProcInfo struct {
|
|
|
|
Addr string `json:"addr"`
|
|
|
|
Processes []SysProcess `json:"processes,omitempty"`
|
|
|
|
Error string `json:"error,omitempty"`
|
2020-03-26 21:07:39 -07:00
|
|
|
}
|
|
|
|
|
2020-11-21 02:22:53 +05:30
|
|
|
// SysProcess - Includes process lvl information about a single process
|
|
|
|
type SysProcess struct {
|
2021-02-06 11:02:28 +05:30
|
|
|
Pid int32 `json:"pid"`
|
|
|
|
Background bool `json:"background,omitempty"`
|
|
|
|
CPUPercent float64 `json:"cpupercent,omitempty"`
|
|
|
|
Children []int32 `json:"children,omitempty"`
|
|
|
|
CmdLine string `json:"cmd,omitempty"`
|
|
|
|
ConnectionCount int `json:"connection_count,omitempty"`
|
|
|
|
CreateTime int64 `json:"createtime,omitempty"`
|
|
|
|
Cwd string `json:"cwd,omitempty"`
|
|
|
|
Exe string `json:"exe,omitempty"`
|
|
|
|
Gids []int32 `json:"gids,omitempty"`
|
|
|
|
IOCounters *process.IOCountersStat `json:"iocounters,omitempty"`
|
|
|
|
IsRunning bool `json:"isrunning,omitempty"`
|
|
|
|
MemInfo *process.MemoryInfoStat `json:"meminfo,omitempty"`
|
|
|
|
MemMaps *[]process.MemoryMapsStat `json:"memmaps,omitempty"`
|
|
|
|
MemPercent float32 `json:"mempercent,omitempty"`
|
|
|
|
Name string `json:"name,omitempty"`
|
|
|
|
Nice int32 `json:"nice,omitempty"`
|
|
|
|
NumCtxSwitches *process.NumCtxSwitchesStat `json:"numctxswitches,omitempty"`
|
|
|
|
NumFds int32 `json:"numfds,omitempty"`
|
|
|
|
NumThreads int32 `json:"numthreads,omitempty"`
|
|
|
|
PageFaults *process.PageFaultsStat `json:"pagefaults,omitempty"`
|
|
|
|
Parent int32 `json:"parent,omitempty"`
|
|
|
|
Ppid int32 `json:"ppid,omitempty"`
|
|
|
|
Status string `json:"status,omitempty"`
|
|
|
|
Tgid int32 `json:"tgid,omitempty"`
|
|
|
|
Times *cpu.TimesStat `json:"cputimes,omitempty"`
|
|
|
|
Uids []int32 `json:"uids,omitempty"`
|
|
|
|
Username string `json:"username,omitempty"`
|
2020-03-26 21:07:39 -07:00
|
|
|
}
|
|
|
|
|
2020-11-21 02:22:53 +05:30
|
|
|
// ServerMemInfo - Includes host virtual and swap mem information
|
|
|
|
type ServerMemInfo struct {
|
2020-03-26 21:07:39 -07:00
|
|
|
Addr string `json:"addr"`
|
|
|
|
SwapMem *mem.SwapMemoryStat `json:"swap,omitempty"`
|
|
|
|
VirtualMem *mem.VirtualMemoryStat `json:"virtualmem,omitempty"`
|
|
|
|
Error string `json:"error,omitempty"`
|
|
|
|
}
|
|
|
|
|
2020-11-21 02:22:53 +05:30
|
|
|
// ServerOsInfo - Includes host os information
|
|
|
|
type ServerOsInfo struct {
|
2020-03-26 21:07:39 -07:00
|
|
|
Addr string `json:"addr"`
|
|
|
|
Info *host.InfoStat `json:"info,omitempty"`
|
|
|
|
Sensors []host.TemperatureStat `json:"sensors,omitempty"`
|
|
|
|
Users []host.UserStat `json:"users,omitempty"`
|
|
|
|
Error string `json:"error,omitempty"`
|
|
|
|
}
|
|
|
|
|
2020-11-21 02:22:53 +05:30
|
|
|
// ServerCPUInfo - Includes cpu and timer stats of each node of the MinIO cluster
|
|
|
|
type ServerCPUInfo struct {
|
2020-03-26 21:07:39 -07:00
|
|
|
Addr string `json:"addr"`
|
|
|
|
CPUStat []cpu.InfoStat `json:"cpu,omitempty"`
|
|
|
|
TimeStat []cpu.TimesStat `json:"time,omitempty"`
|
|
|
|
Error string `json:"error,omitempty"`
|
|
|
|
}
|
|
|
|
|
2020-11-21 02:22:53 +05:30
|
|
|
// MinioHealthInfo - Includes MinIO confifuration information
|
|
|
|
type MinioHealthInfo struct {
|
2020-03-26 21:07:39 -07:00
|
|
|
Info InfoMessage `json:"info,omitempty"`
|
|
|
|
Config interface{} `json:"config,omitempty"`
|
|
|
|
Error string `json:"error,omitempty"`
|
|
|
|
}
|
|
|
|
|
2020-11-21 23:11:33 +05:30
|
|
|
// ServerDiskHwInfo - Includes usage counters, disk counters and partitions
|
|
|
|
type ServerDiskHwInfo struct {
|
|
|
|
Addr string `json:"addr"`
|
|
|
|
Usage []*diskhw.UsageStat `json:"usages,omitempty"`
|
|
|
|
Partitions []PartitionStat `json:"partitions,omitempty"`
|
|
|
|
Counters map[string]diskhw.IOCountersStat `json:"counters,omitempty"`
|
|
|
|
Error string `json:"error,omitempty"`
|
|
|
|
}
|
|
|
|
|
|
|
|
// PartitionStat - includes data from both shirou/psutil.diskHw.PartitionStat as well as SMART data
|
|
|
|
type PartitionStat struct {
|
|
|
|
Device string `json:"device"`
|
|
|
|
Mountpoint string `json:"mountpoint,omitempty"`
|
|
|
|
Fstype string `json:"fstype,omitempty"`
|
|
|
|
Opts string `json:"opts,omitempty"`
|
|
|
|
SmartInfo smart.Info `json:"smartInfo,omitempty"`
|
|
|
|
}
|
|
|
|
|
2020-11-21 02:22:53 +05:30
|
|
|
// PerfInfo - Includes Drive and Net perf info for the entire MinIO cluster
|
|
|
|
type PerfInfo struct {
|
|
|
|
DriveInfo []ServerDrivesInfo `json:"drives,omitempty"`
|
|
|
|
Net []ServerNetHealthInfo `json:"net,omitempty"`
|
|
|
|
NetParallel ServerNetHealthInfo `json:"net_parallel,omitempty"`
|
2020-03-31 17:08:28 -07:00
|
|
|
Error string `json:"error,omitempty"`
|
2020-03-26 21:07:39 -07:00
|
|
|
}
|
|
|
|
|
2020-11-21 02:22:53 +05:30
|
|
|
// ServerDrivesInfo - Drive info about all drives in a single MinIO node
|
|
|
|
type ServerDrivesInfo struct {
|
|
|
|
Addr string `json:"addr"`
|
2021-01-18 20:35:38 -08:00
|
|
|
Serial []DrivePerfInfo `json:"serial,omitempty"` // Drive perf info collected one drive at a time
|
|
|
|
Parallel []DrivePerfInfo `json:"parallel,omitempty"` // Drive perf info collected in parallel
|
2020-11-21 02:22:53 +05:30
|
|
|
Error string `json:"error,omitempty"`
|
2020-03-26 21:07:39 -07:00
|
|
|
}
|
|
|
|
|
2020-11-21 02:22:53 +05:30
|
|
|
// DrivePerfInfo - Stats about a single drive in a MinIO node
|
|
|
|
type DrivePerfInfo struct {
|
2020-03-26 21:07:39 -07:00
|
|
|
Path string `json:"endpoint"`
|
|
|
|
Latency disk.Latency `json:"latency,omitempty"`
|
|
|
|
Throughput disk.Throughput `json:"throughput,omitempty"`
|
|
|
|
Error string `json:"error,omitempty"`
|
|
|
|
}
|
|
|
|
|
2020-11-21 02:22:53 +05:30
|
|
|
// ServerNetHealthInfo - Network health info about a single MinIO node
|
|
|
|
type ServerNetHealthInfo struct {
|
|
|
|
Addr string `json:"addr"`
|
|
|
|
Net []NetPerfInfo `json:"net,omitempty"`
|
|
|
|
Error string `json:"error,omitempty"`
|
2020-03-26 21:07:39 -07:00
|
|
|
}
|
|
|
|
|
2020-11-21 02:22:53 +05:30
|
|
|
// NetPerfInfo - one-to-one network connectivity Stats between 2 MinIO nodes
|
|
|
|
type NetPerfInfo struct {
|
2020-03-26 21:07:39 -07:00
|
|
|
Addr string `json:"remote"`
|
|
|
|
Latency net.Latency `json:"latency,omitempty"`
|
|
|
|
Throughput net.Throughput `json:"throughput,omitempty"`
|
|
|
|
Error string `json:"error,omitempty"`
|
|
|
|
}
|
|
|
|
|
2020-11-21 02:22:53 +05:30
|
|
|
// HealthDataType is the string-backed name of one category of health data
// that can be requested from the server.
type HealthDataType string
|
2020-03-26 21:07:39 -07:00
|
|
|
|
2020-11-21 02:22:53 +05:30
|
|
|
// HealthDataTypes
|
2020-03-26 21:07:39 -07:00
|
|
|
const (
|
2020-11-21 02:22:53 +05:30
|
|
|
HealthDataTypePerfDrive HealthDataType = "perfdrive"
|
|
|
|
HealthDataTypePerfNet HealthDataType = "perfnet"
|
|
|
|
HealthDataTypeMinioInfo HealthDataType = "minioinfo"
|
|
|
|
HealthDataTypeMinioConfig HealthDataType = "minioconfig"
|
|
|
|
HealthDataTypeSysCPU HealthDataType = "syscpu"
|
|
|
|
HealthDataTypeSysDiskHw HealthDataType = "sysdiskhw"
|
|
|
|
HealthDataTypeSysDocker HealthDataType = "sysdocker" // is this really needed?
|
|
|
|
HealthDataTypeSysOsInfo HealthDataType = "sysosinfo"
|
|
|
|
HealthDataTypeSysLoad HealthDataType = "sysload" // provides very little info. Making it TBD
|
|
|
|
HealthDataTypeSysMem HealthDataType = "sysmem"
|
|
|
|
HealthDataTypeSysNet HealthDataType = "sysnet"
|
|
|
|
HealthDataTypeSysProcess HealthDataType = "sysprocess"
|
2020-03-26 21:07:39 -07:00
|
|
|
)
|
|
|
|
|
2020-11-21 02:22:53 +05:30
|
|
|
// HealthDataTypesMap - Map of Health datatypes
|
|
|
|
var HealthDataTypesMap = map[string]HealthDataType{
|
|
|
|
"perfdrive": HealthDataTypePerfDrive,
|
|
|
|
"perfnet": HealthDataTypePerfNet,
|
|
|
|
"minioinfo": HealthDataTypeMinioInfo,
|
|
|
|
"minioconfig": HealthDataTypeMinioConfig,
|
|
|
|
"syscpu": HealthDataTypeSysCPU,
|
|
|
|
"sysdiskhw": HealthDataTypeSysDiskHw,
|
|
|
|
"sysdocker": HealthDataTypeSysDocker,
|
|
|
|
"sysosinfo": HealthDataTypeSysOsInfo,
|
|
|
|
"sysload": HealthDataTypeSysLoad,
|
|
|
|
"sysmem": HealthDataTypeSysMem,
|
|
|
|
"sysnet": HealthDataTypeSysNet,
|
|
|
|
"sysprocess": HealthDataTypeSysProcess,
|
2020-03-26 21:07:39 -07:00
|
|
|
}
|
|
|
|
|
2020-11-21 02:22:53 +05:30
|
|
|
// HealthDataTypesList - List of Health datatypes
|
|
|
|
var HealthDataTypesList = []HealthDataType{
|
|
|
|
HealthDataTypePerfDrive,
|
|
|
|
HealthDataTypePerfNet,
|
|
|
|
HealthDataTypeMinioInfo,
|
|
|
|
HealthDataTypeMinioConfig,
|
|
|
|
HealthDataTypeSysCPU,
|
|
|
|
HealthDataTypeSysDiskHw,
|
|
|
|
HealthDataTypeSysDocker,
|
|
|
|
HealthDataTypeSysOsInfo,
|
|
|
|
HealthDataTypeSysLoad,
|
|
|
|
HealthDataTypeSysMem,
|
|
|
|
HealthDataTypeSysNet,
|
|
|
|
HealthDataTypeSysProcess,
|
2020-03-26 21:07:39 -07:00
|
|
|
}
|
|
|
|
|
2020-11-21 02:22:53 +05:30
|
|
|
// ServerHealthInfo - Connect to a minio server and call Health Info Management API
|
|
|
|
// to fetch server's information represented by HealthInfo structure
|
|
|
|
func (adm *AdminClient) ServerHealthInfo(ctx context.Context, healthDataTypes []HealthDataType, deadline time.Duration) <-chan HealthInfo {
|
|
|
|
respChan := make(chan HealthInfo)
|
2020-03-26 21:07:39 -07:00
|
|
|
go func() {
|
|
|
|
v := url.Values{}
|
|
|
|
|
2020-04-14 11:48:32 -07:00
|
|
|
v.Set("deadline",
|
|
|
|
deadline.Truncate(1*time.Second).String())
|
|
|
|
|
2020-03-26 21:07:39 -07:00
|
|
|
// start with all set to false
|
2020-11-21 02:22:53 +05:30
|
|
|
for _, d := range HealthDataTypesList {
|
2020-03-26 21:07:39 -07:00
|
|
|
v.Set(string(d), "false")
|
|
|
|
}
|
|
|
|
|
|
|
|
// only 'trueify' user provided values
|
2020-11-21 02:22:53 +05:30
|
|
|
for _, d := range healthDataTypes {
|
2020-03-26 21:07:39 -07:00
|
|
|
v.Set(string(d), "true")
|
|
|
|
}
|
2020-11-21 02:22:53 +05:30
|
|
|
var healthInfoMessage HealthInfo
|
|
|
|
healthInfoMessage.TimeStamp = time.Now()
|
2020-03-26 21:07:39 -07:00
|
|
|
|
|
|
|
resp, err := adm.executeMethod(ctx, "GET", requestData{
|
2020-11-21 02:22:53 +05:30
|
|
|
relPath: adminAPIPrefix + "/healthinfo",
|
2020-03-26 21:07:39 -07:00
|
|
|
queryValues: v,
|
|
|
|
})
|
|
|
|
|
|
|
|
defer closeResponse(resp)
|
|
|
|
if err != nil {
|
2020-11-21 02:22:53 +05:30
|
|
|
respChan <- HealthInfo{
|
2020-03-26 21:07:39 -07:00
|
|
|
Error: err.Error(),
|
|
|
|
}
|
2020-04-08 06:04:27 -07:00
|
|
|
close(respChan)
|
2020-03-26 21:07:39 -07:00
|
|
|
return
|
|
|
|
}
|
2020-04-08 06:04:27 -07:00
|
|
|
|
2020-03-26 21:07:39 -07:00
|
|
|
// Check response http status code
|
|
|
|
if resp.StatusCode != http.StatusOK {
|
2020-11-21 02:22:53 +05:30
|
|
|
respChan <- HealthInfo{
|
2020-03-26 21:07:39 -07:00
|
|
|
Error: httpRespToErrorResponse(resp).Error(),
|
|
|
|
}
|
|
|
|
return
|
|
|
|
}
|
2020-04-08 06:04:27 -07:00
|
|
|
|
2020-03-26 21:07:39 -07:00
|
|
|
// Unmarshal the server's json response
|
|
|
|
decoder := json.NewDecoder(resp.Body)
|
|
|
|
for {
|
2020-11-21 02:22:53 +05:30
|
|
|
err := decoder.Decode(&healthInfoMessage)
|
|
|
|
healthInfoMessage.TimeStamp = time.Now()
|
2020-04-08 06:04:27 -07:00
|
|
|
|
2020-03-26 21:07:39 -07:00
|
|
|
if err == io.EOF {
|
|
|
|
break
|
|
|
|
}
|
|
|
|
if err != nil {
|
2020-11-21 02:22:53 +05:30
|
|
|
respChan <- HealthInfo{
|
2020-03-26 21:07:39 -07:00
|
|
|
Error: err.Error(),
|
|
|
|
}
|
|
|
|
}
|
2020-11-21 02:22:53 +05:30
|
|
|
respChan <- healthInfoMessage
|
2020-03-26 21:07:39 -07:00
|
|
|
}
|
|
|
|
|
2020-11-21 02:22:53 +05:30
|
|
|
respChan <- healthInfoMessage
|
2021-03-19 03:10:21 +05:30
|
|
|
|
|
|
|
if v.Get(string(HealthDataTypeMinioInfo)) == "true" {
|
|
|
|
info, err := adm.ServerInfo(ctx)
|
|
|
|
if err != nil {
|
|
|
|
respChan <- HealthInfo{
|
|
|
|
Error: err.Error(),
|
|
|
|
}
|
|
|
|
return
|
|
|
|
}
|
|
|
|
healthInfoMessage.Minio.Info = info
|
|
|
|
respChan <- healthInfoMessage
|
|
|
|
}
|
|
|
|
|
2020-03-26 21:07:39 -07:00
|
|
|
close(respChan)
|
|
|
|
}()
|
|
|
|
return respChan
|
|
|
|
}
|
2021-01-18 20:35:38 -08:00
|
|
|
|
|
|
|
// GetTotalCapacity gets the total capacity a server holds.
|
|
|
|
func (s *ServerDiskHwInfo) GetTotalCapacity() (capacity uint64) {
|
|
|
|
for _, u := range s.Usage {
|
|
|
|
capacity += u.Total
|
|
|
|
}
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
// GetTotalFreeCapacity gets the total capacity that is free.
|
|
|
|
func (s *ServerDiskHwInfo) GetTotalFreeCapacity() (capacity uint64) {
|
|
|
|
for _, u := range s.Usage {
|
|
|
|
capacity += u.Free
|
|
|
|
}
|
|
|
|
return
|
|
|
|
}
|
|
|
|
|
|
|
|
// GetTotalUsedCapacity gets the total capacity used.
|
|
|
|
func (s *ServerDiskHwInfo) GetTotalUsedCapacity() (capacity uint64) {
|
|
|
|
for _, u := range s.Usage {
|
|
|
|
capacity += u.Used
|
|
|
|
}
|
|
|
|
return
|
|
|
|
}
|