2021-04-18 12:41:13 -07:00
|
|
|
// Copyright (c) 2015-2021 MinIO, Inc.
|
|
|
|
//
|
|
|
|
// This file is part of MinIO Object Storage stack
|
|
|
|
//
|
|
|
|
// This program is free software: you can redistribute it and/or modify
|
|
|
|
// it under the terms of the GNU Affero General Public License as published by
|
|
|
|
// the Free Software Foundation, either version 3 of the License, or
|
|
|
|
// (at your option) any later version.
|
|
|
|
//
|
|
|
|
// This program is distributed in the hope that it will be useful
|
|
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
// GNU Affero General Public License for more details.
|
|
|
|
//
|
|
|
|
// You should have received a copy of the GNU Affero General Public License
|
|
|
|
// along with this program. If not, see <http://www.gnu.org/licenses/>.
|
2020-06-12 20:04:01 -07:00
|
|
|
|
|
|
|
package cmd
|
|
|
|
|
|
|
|
import (
|
2021-11-18 12:15:22 -08:00
|
|
|
"encoding/binary"
|
2020-06-12 20:04:01 -07:00
|
|
|
"encoding/hex"
|
|
|
|
"encoding/json"
|
|
|
|
"fmt"
|
|
|
|
"time"
|
|
|
|
|
2021-11-18 12:15:22 -08:00
|
|
|
"github.com/cespare/xxhash/v2"
|
2020-06-12 20:04:01 -07:00
|
|
|
jsoniter "github.com/json-iterator/go"
|
2021-06-01 14:59:40 -07:00
|
|
|
"github.com/minio/minio/internal/logger"
|
2020-06-12 20:04:01 -07:00
|
|
|
)
|
|
|
|
|
|
|
|
// XL constants.
|
|
|
|
const (
|
|
|
|
// XL metadata file carries per object metadata.
|
|
|
|
xlStorageFormatFileV1 = "xl.json"
|
|
|
|
)
|
|
|
|
|
|
|
|
// Valid - tells us if the format is sane by validating
|
|
|
|
// format version and erasure coding information.
|
|
|
|
func (m *xlMetaV1Object) valid() bool {
|
|
|
|
return isXLMetaFormatValid(m.Version, m.Format) &&
|
|
|
|
isXLMetaErasureInfoValid(m.Erasure.DataBlocks, m.Erasure.ParityBlocks)
|
|
|
|
}
|
|
|
|
|
|
|
|
// Verifies if the backend format metadata is sane by validating
|
|
|
|
// the version string and format style.
|
|
|
|
func isXLMetaFormatValid(version, format string) bool {
|
|
|
|
return ((version == xlMetaVersion101 ||
|
|
|
|
version == xlMetaVersion100) &&
|
|
|
|
format == xlMetaFormat)
|
|
|
|
}
|
|
|
|
|
|
|
|
// Verifies if the backend format metadata is sane by validating
|
|
|
|
// the ErasureInfo, i.e. data and parity blocks.
|
|
|
|
func isXLMetaErasureInfoValid(data, parity int) bool {
|
2022-05-30 10:58:37 -07:00
|
|
|
return ((data >= parity) && (data > 0) && (parity >= 0))
|
2020-06-12 20:04:01 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
//go:generate msgp -file=$GOFILE -unexported
|
|
|
|
|
|
|
|
// A xlMetaV1Object represents `xl.meta` metadata header.
|
|
|
|
type xlMetaV1Object struct {
|
|
|
|
Version string `json:"version"` // Version of the current `xl.meta`.
|
|
|
|
Format string `json:"format"` // Format of the current `xl.meta`.
|
|
|
|
Stat StatInfo `json:"stat"` // Stat of the current object `xl.meta`.
|
|
|
|
// Erasure coded info for the current object `xl.meta`.
|
|
|
|
Erasure ErasureInfo `json:"erasure"`
|
|
|
|
// MinIO release tag for current object `xl.meta`.
|
|
|
|
Minio struct {
|
|
|
|
Release string `json:"release"`
|
|
|
|
} `json:"minio"`
|
|
|
|
// Metadata map for current object `xl.meta`.
|
|
|
|
Meta map[string]string `json:"meta,omitempty"`
|
|
|
|
// Captures all the individual object `xl.meta`.
|
|
|
|
Parts []ObjectPartInfo `json:"parts,omitempty"`
|
|
|
|
|
|
|
|
// Dummy values used for legacy use cases.
|
|
|
|
VersionID string `json:"versionId,omitempty"`
|
|
|
|
DataDir string `json:"dataDir,omitempty"` // always points to "legacy"
|
|
|
|
}
|
|
|
|
|
|
|
|
// StatInfo - carries stat information of the object.
|
|
|
|
type StatInfo struct {
|
|
|
|
Size int64 `json:"size"` // Size of the object `xl.meta`.
|
|
|
|
ModTime time.Time `json:"modTime"` // ModTime of the object `xl.meta`.
|
2021-10-01 11:50:00 -07:00
|
|
|
Name string `json:"name"`
|
|
|
|
Dir bool `json:"dir"`
|
2021-10-21 11:20:13 -07:00
|
|
|
Mode uint32 `json:"mode"`
|
2020-06-12 20:04:01 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
// ErasureInfo holds erasure coding and bitrot related information.
|
|
|
|
type ErasureInfo struct {
|
|
|
|
// Algorithm is the string representation of erasure-coding-algorithm
|
|
|
|
Algorithm string `json:"algorithm"`
|
|
|
|
// DataBlocks is the number of data blocks for erasure-coding
|
|
|
|
DataBlocks int `json:"data"`
|
|
|
|
// ParityBlocks is the number of parity blocks for erasure-coding
|
|
|
|
ParityBlocks int `json:"parity"`
|
|
|
|
// BlockSize is the size of one erasure-coded block
|
|
|
|
BlockSize int64 `json:"blockSize"`
|
|
|
|
// Index is the index of the current disk
|
|
|
|
Index int `json:"index"`
|
|
|
|
// Distribution is the distribution of the data and parity blocks
|
|
|
|
Distribution []int `json:"distribution"`
|
|
|
|
// Checksums holds all bitrot checksums of all erasure encoded blocks
|
|
|
|
Checksums []ChecksumInfo `json:"checksum,omitempty"`
|
|
|
|
}
|
|
|
|
|
2023-06-18 18:20:15 -07:00
|
|
|
// Equal equates current erasure info with newer erasure info.
|
|
|
|
// returns false if one of the following check fails
|
|
|
|
// - erasure algorithm is different
|
|
|
|
// - data blocks are different
|
|
|
|
// - parity blocks are different
|
|
|
|
// - block size is different
|
|
|
|
// - distribution array size is different
|
|
|
|
// - distribution indexes are different
|
|
|
|
func (ei ErasureInfo) Equal(nei ErasureInfo) bool {
|
|
|
|
if ei.Algorithm != nei.Algorithm {
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
if ei.DataBlocks != nei.DataBlocks {
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
if ei.ParityBlocks != nei.ParityBlocks {
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
if ei.BlockSize != nei.BlockSize {
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
if len(ei.Distribution) != len(nei.Distribution) {
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
for i, ecindex := range ei.Distribution {
|
|
|
|
if ecindex != nei.Distribution[i] {
|
|
|
|
return false
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return true
|
|
|
|
}
|
|
|
|
|
2020-06-12 20:04:01 -07:00
|
|
|
// BitrotAlgorithm specifies a algorithm used for bitrot protection.
|
|
|
|
type BitrotAlgorithm uint
|
|
|
|
|
|
|
|
const (
|
|
|
|
// SHA256 represents the SHA-256 hash function
|
|
|
|
SHA256 BitrotAlgorithm = 1 + iota
|
|
|
|
// HighwayHash256 represents the HighwayHash-256 hash function
|
|
|
|
HighwayHash256
|
|
|
|
// HighwayHash256S represents the Streaming HighwayHash-256 hash function
|
|
|
|
HighwayHash256S
|
|
|
|
// BLAKE2b512 represents the BLAKE2b-512 hash function
|
|
|
|
BLAKE2b512
|
|
|
|
)
|
|
|
|
|
|
|
|
// DefaultBitrotAlgorithm is the default algorithm used for bitrot protection.
|
|
|
|
const (
|
|
|
|
DefaultBitrotAlgorithm = HighwayHash256S
|
|
|
|
)
|
|
|
|
|
|
|
|
// ObjectPartInfo Info of each part kept in the multipart metadata
|
|
|
|
// file after CompleteMultipartUpload() is called.
|
|
|
|
type ObjectPartInfo struct {
|
2022-08-30 01:57:16 +02:00
|
|
|
ETag string `json:"etag,omitempty"`
|
|
|
|
Number int `json:"number"`
|
|
|
|
Size int64 `json:"size"` // Size of the part on the disk.
|
|
|
|
ActualSize int64 `json:"actualSize"` // Original size of the part without compression or encryption bytes.
|
|
|
|
ModTime time.Time `json:"modTime"` // Date and time at which the part was uploaded.
|
|
|
|
Index []byte `json:"index,omitempty" msg:"index,omitempty"`
|
|
|
|
Checksums map[string]string `json:"crc,omitempty" msg:"crc,omitempty"` // Content Checksums
|
2020-06-12 20:04:01 -07:00
|
|
|
}
|
|
|
|
|
|
|
|
// ChecksumInfo - carries checksums of individual scattered parts per disk.
|
|
|
|
type ChecksumInfo struct {
|
|
|
|
PartNumber int
|
|
|
|
Algorithm BitrotAlgorithm
|
|
|
|
Hash []byte
|
|
|
|
}
|
|
|
|
|
|
|
|
type checksumInfoJSON struct {
|
|
|
|
Name string `json:"name"`
|
|
|
|
Algorithm string `json:"algorithm"`
|
|
|
|
Hash string `json:"hash,omitempty"`
|
|
|
|
}
|
|
|
|
|
|
|
|
// MarshalJSON marshals the ChecksumInfo struct
|
|
|
|
func (c ChecksumInfo) MarshalJSON() ([]byte, error) {
|
|
|
|
info := checksumInfoJSON{
|
|
|
|
Name: fmt.Sprintf("part.%d", c.PartNumber),
|
|
|
|
Algorithm: c.Algorithm.String(),
|
|
|
|
Hash: hex.EncodeToString(c.Hash),
|
|
|
|
}
|
|
|
|
return json.Marshal(info)
|
|
|
|
}
|
|
|
|
|
|
|
|
// UnmarshalJSON - custom checksum info unmarshaller
|
|
|
|
func (c *ChecksumInfo) UnmarshalJSON(data []byte) error {
|
|
|
|
var info checksumInfoJSON
|
2022-01-02 09:15:06 -08:00
|
|
|
json := jsoniter.ConfigCompatibleWithStandardLibrary
|
2020-06-12 20:04:01 -07:00
|
|
|
if err := json.Unmarshal(data, &info); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
sum, err := hex.DecodeString(info.Hash)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
c.Algorithm = BitrotAlgorithmFromString(info.Algorithm)
|
|
|
|
c.Hash = sum
|
|
|
|
if _, err = fmt.Sscanf(info.Name, "part.%d", &c.PartNumber); err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
|
|
|
|
if !c.Algorithm.Available() {
|
|
|
|
logger.LogIf(GlobalContext, errBitrotHashAlgoInvalid)
|
|
|
|
return errBitrotHashAlgoInvalid
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
// constant and shouldn't be changed.
|
2021-04-19 10:30:42 -07:00
|
|
|
const (
|
|
|
|
legacyDataDir = "legacy"
|
|
|
|
)
|
2020-06-12 20:04:01 -07:00
|
|
|
|
|
|
|
func (m *xlMetaV1Object) ToFileInfo(volume, path string) (FileInfo, error) {
|
|
|
|
if !m.valid() {
|
|
|
|
return FileInfo{}, errFileCorrupt
|
|
|
|
}
|
2021-04-19 10:30:42 -07:00
|
|
|
|
2020-11-12 12:12:09 -08:00
|
|
|
fi := FileInfo{
|
2021-12-02 11:29:16 -08:00
|
|
|
Volume: volume,
|
|
|
|
Name: path,
|
|
|
|
ModTime: m.Stat.ModTime,
|
|
|
|
Size: m.Stat.Size,
|
|
|
|
Metadata: m.Meta,
|
|
|
|
Parts: m.Parts,
|
|
|
|
Erasure: m.Erasure,
|
|
|
|
VersionID: m.VersionID,
|
|
|
|
DataDir: m.DataDir,
|
|
|
|
XLV1: true,
|
|
|
|
NumVersions: 1,
|
2020-11-12 12:12:09 -08:00
|
|
|
}
|
2021-11-17 15:49:12 -08:00
|
|
|
|
2020-11-12 12:12:09 -08:00
|
|
|
return fi, nil
|
2020-06-12 20:04:01 -07:00
|
|
|
}
|
|
|
|
|
2021-11-18 12:15:22 -08:00
|
|
|
// Signature will return a signature that is expected to be the same across all disks.
|
|
|
|
func (m *xlMetaV1Object) Signature() [4]byte {
|
|
|
|
// Shallow copy
|
|
|
|
c := *m
|
|
|
|
// Zero unimportant fields
|
|
|
|
c.Erasure.Index = 0
|
|
|
|
c.Minio.Release = ""
|
|
|
|
crc := hashDeterministicString(c.Meta)
|
|
|
|
c.Meta = nil
|
|
|
|
|
|
|
|
if bts, err := c.MarshalMsg(metaDataPoolGet()); err == nil {
|
|
|
|
crc ^= xxhash.Sum64(bts)
|
|
|
|
metaDataPoolPut(bts)
|
|
|
|
}
|
|
|
|
|
|
|
|
// Combine upper and lower part
|
|
|
|
var tmp [4]byte
|
|
|
|
binary.LittleEndian.PutUint32(tmp[:], uint32(crc^(crc>>32)))
|
|
|
|
return tmp
|
|
|
|
}
|
|
|
|
|
2020-06-12 20:04:01 -07:00
|
|
|
// XL metadata constants.
|
|
|
|
const (
|
|
|
|
// XL meta version.
|
|
|
|
xlMetaVersion101 = "1.0.1"
|
|
|
|
|
|
|
|
// XL meta version.
|
|
|
|
xlMetaVersion100 = "1.0.0"
|
|
|
|
|
|
|
|
// XL meta format string.
|
|
|
|
xlMetaFormat = "xl"
|
|
|
|
)
|