2021-04-18 12:41:13 -07:00
|
|
|
// Copyright (c) 2015-2021 MinIO, Inc.
|
|
|
|
//
|
|
|
|
// This file is part of MinIO Object Storage stack
|
|
|
|
//
|
|
|
|
// This program is free software: you can redistribute it and/or modify
|
|
|
|
// it under the terms of the GNU Affero General Public License as published by
|
|
|
|
// the Free Software Foundation, either version 3 of the License, or
|
|
|
|
// (at your option) any later version.
|
|
|
|
//
|
|
|
|
// This program is distributed in the hope that it will be useful
|
|
|
|
// but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
// GNU Affero General Public License for more details.
|
|
|
|
//
|
|
|
|
// You should have received a copy of the GNU Affero General Public License
|
|
|
|
// along with this program. If not, see <http://www.gnu.org/licenses/>.
|
2016-04-29 17:52:17 -07:00
|
|
|
|
2016-08-18 16:23:42 -07:00
|
|
|
package cmd
|
2016-04-29 17:52:17 -07:00
|
|
|
|
2016-05-25 01:33:39 -07:00
|
|
|
import (
|
2021-03-08 11:30:43 -08:00
|
|
|
"sync"
|
2019-07-05 14:06:12 -07:00
|
|
|
|
2021-06-17 08:16:31 -07:00
|
|
|
"github.com/dustin/go-humanize"
|
2016-05-25 01:33:39 -07:00
|
|
|
)
|
2016-04-29 17:52:17 -07:00
|
|
|
|
2016-05-29 15:38:14 -07:00
|
|
|
const (
|
|
|
|
// Block size used for all internal operations version 1.
|
[feat]: change erasure coding default block size from 10MiB to 1MiB (#11721)
major performance improvements in range GETs to avoid large
read amplification when ranges are tiny and random
```
-------------------
Operation: GET
Operations: 142014 -> 339421
Duration: 4m50s -> 4m56s
* Average: +139.41% (+1177.3 MiB/s) throughput, +139.11% (+658.4) obj/s
* Fastest: +125.24% (+1207.4 MiB/s) throughput, +132.32% (+612.9) obj/s
* 50% Median: +139.06% (+1175.7 MiB/s) throughput, +133.46% (+660.9) obj/s
* Slowest: +203.40% (+1267.9 MiB/s) throughput, +198.59% (+753.5) obj/s
```
TTFB from 10MiB BlockSize
```
* First Access TTFB: Avg: 81ms, Median: 61ms, Best: 20ms, Worst: 2.056s
```
TTFB from 1MiB BlockSize
```
* First Access TTFB: Avg: 22ms, Median: 21ms, Best: 8ms, Worst: 91ms
```
Full object reads however do see a slight change which won't be
noticeable in real world, so not doing any comparisons
TTFB still had improvements with full object reads with 1MiB
```
* First Access TTFB: Avg: 68ms, Median: 35ms, Best: 11ms, Worst: 1.16s
```
v/s
TTFB with 10MiB
```
* First Access TTFB: Avg: 388ms, Median: 98ms, Best: 20ms, Worst: 4.156s
```
This change should affect all new uploads, previous uploads should
continue to work with business as usual. But dramatic improvements can
be seen with these changes.
2021-03-06 14:09:34 -08:00
|
|
|
|
|
|
|
// TLDR..
|
|
|
|
// Not used anymore xl.meta captures the right blockSize
|
|
|
|
// so blockSizeV2 should be used for all future purposes.
|
|
|
|
// this value is kept here to calculate the max API
|
|
|
|
// requests based on RAM size for existing content.
|
2016-11-22 18:18:22 -08:00
|
|
|
blockSizeV1 = 10 * humanize.MiByte
|
2016-06-25 15:33:27 +05:30
|
|
|
|
[feat]: change erasure coding default block size from 10MiB to 1MiB (#11721)
major performance improvements in range GETs to avoid large
read amplification when ranges are tiny and random
```
-------------------
Operation: GET
Operations: 142014 -> 339421
Duration: 4m50s -> 4m56s
* Average: +139.41% (+1177.3 MiB/s) throughput, +139.11% (+658.4) obj/s
* Fastest: +125.24% (+1207.4 MiB/s) throughput, +132.32% (+612.9) obj/s
* 50% Median: +139.06% (+1175.7 MiB/s) throughput, +133.46% (+660.9) obj/s
* Slowest: +203.40% (+1267.9 MiB/s) throughput, +198.59% (+753.5) obj/s
```
TTFB from 10MiB BlockSize
```
* First Access TTFB: Avg: 81ms, Median: 61ms, Best: 20ms, Worst: 2.056s
```
TTFB from 1MiB BlockSize
```
* First Access TTFB: Avg: 22ms, Median: 21ms, Best: 8ms, Worst: 91ms
```
Full object reads however do see a slight change which won't be
noticeable in real world, so not doing any comparisons
TTFB still had improvements with full object reads with 1MiB
```
* First Access TTFB: Avg: 68ms, Median: 35ms, Best: 11ms, Worst: 1.16s
```
v/s
TTFB with 10MiB
```
* First Access TTFB: Avg: 388ms, Median: 98ms, Best: 20ms, Worst: 4.156s
```
This change should affect all new uploads, previous uploads should
continue to work with business as usual. But dramatic improvements can
be seen with these changes.
2021-03-06 14:09:34 -08:00
|
|
|
// Block size used in erasure coding version 2.
|
|
|
|
blockSizeV2 = 1 * humanize.MiByte
|
|
|
|
|
2016-07-21 17:31:14 -07:00
|
|
|
// Buckets meta prefix.
|
|
|
|
bucketMetaPrefix = "buckets"
|
2017-04-11 08:21:23 +05:30
|
|
|
|
2022-07-25 17:51:32 -07:00
|
|
|
// Deleted Buckets prefix.
|
|
|
|
deletedBucketsPrefix = ".deleted"
|
|
|
|
|
2017-05-14 12:05:51 -07:00
|
|
|
// ETag (hex encoded md5sum) of empty string.
|
|
|
|
emptyETag = "d41d8cd98f00b204e9800998ecf8427e"
|
2016-05-29 15:38:14 -07:00
|
|
|
)
|
|
|
|
|
2016-10-09 23:03:10 -07:00
|
|
|
// Global object layer mutex, used for safely updating object layer.
|
2020-05-03 22:35:40 -07:00
|
|
|
var globalObjLayerMutex sync.RWMutex
|
2016-10-09 23:03:10 -07:00
|
|
|
|
2019-10-30 23:39:09 -07:00
|
|
|
// Global object layer, only accessed by globalObjectAPI.
|
2016-10-09 23:03:10 -07:00
|
|
|
var globalObjectAPI ObjectLayer
|
|
|
|
|
2021-11-16 09:28:29 -08:00
|
|
|
// Global cacheObjects, only accessed by newCacheObjectsFn().
|
2018-03-28 14:14:06 -07:00
|
|
|
var globalCacheObjectAPI CacheObjectLayer
|
|
|
|
|
2023-08-01 10:54:26 -07:00
|
|
|
// storageOpts bundles the flags that newStorageAPI forwards to the
// storage constructors it calls.
type storageOpts struct {
	// cleanUp is passed to newXLStorage when the endpoint is local.
	// healthCheck is passed to newXLStorageDiskIDCheck for local
	// endpoints and to newStorageRESTClient otherwise.
	cleanUp, healthCheck bool
}
|
|
|
|
|
2016-06-02 01:49:46 -07:00
|
|
|
// Depending on the disk type network or local, initialize storage API.
|
2023-08-01 10:54:26 -07:00
|
|
|
func newStorageAPI(endpoint Endpoint, opts storageOpts) (storage StorageAPI, err error) {
|
2017-04-12 04:14:27 +05:30
|
|
|
if endpoint.IsLocal {
|
2023-08-01 10:54:26 -07:00
|
|
|
storage, err := newXLStorage(endpoint, opts.cleanUp)
|
2019-10-25 10:37:53 -07:00
|
|
|
if err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
2023-08-01 10:54:26 -07:00
|
|
|
return newXLStorageDiskIDCheck(storage, opts.healthCheck), nil
|
2016-06-02 01:49:46 -07:00
|
|
|
}
|
2017-04-12 04:14:27 +05:30
|
|
|
|
2023-08-01 10:54:26 -07:00
|
|
|
return newStorageRESTClient(endpoint, opts.healthCheck), nil
|
2016-06-02 01:49:46 -07:00
|
|
|
}
|