add parallel workers in batch replication (#16609)

This commit is contained in:
Harshavardhana 2023-02-13 12:07:58 -08:00 committed by GitHub
parent ee6d96eb46
commit 31188e9327
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
4 changed files with 108 additions and 70 deletions

View File

@ -28,6 +28,8 @@ import (
"math/rand" "math/rand"
"net/http" "net/http"
"net/url" "net/url"
"runtime"
"strconv"
"strings" "strings"
"sync" "sync"
"time" "time"
@ -41,7 +43,9 @@ import (
"github.com/minio/minio/internal/auth" "github.com/minio/minio/internal/auth"
xhttp "github.com/minio/minio/internal/http" xhttp "github.com/minio/minio/internal/http"
"github.com/minio/minio/internal/logger" "github.com/minio/minio/internal/logger"
"github.com/minio/minio/internal/workers"
"github.com/minio/pkg/console" "github.com/minio/pkg/console"
"github.com/minio/pkg/env"
iampolicy "github.com/minio/pkg/iam/policy" iampolicy "github.com/minio/pkg/iam/policy"
"github.com/minio/pkg/wildcard" "github.com/minio/pkg/wildcard"
"gopkg.in/yaml.v2" "gopkg.in/yaml.v2"
@ -356,6 +360,8 @@ func (r *BatchJobReplicateV1) ReplicateToTarget(ctx context.Context, api ObjectL
// batchJobInfo current batch replication information // batchJobInfo current batch replication information
type batchJobInfo struct { type batchJobInfo struct {
mu sync.RWMutex `json:"-" msg:"-"`
Version int `json:"-" msg:"v"` Version int `json:"-" msg:"v"`
JobID string `json:"jobID" msg:"jid"` JobID string `json:"jobID" msg:"jid"`
JobType string `json:"jobType" msg:"jt"` JobType string `json:"jobType" msg:"jt"`
@ -425,6 +431,9 @@ func (ri *batchJobInfo) load(ctx context.Context, api ObjectLayer, job BatchJobR
return fmt.Errorf("batchRepl: unknown version: %d", binary.LittleEndian.Uint16(data[2:4])) return fmt.Errorf("batchRepl: unknown version: %d", binary.LittleEndian.Uint16(data[2:4]))
} }
ri.mu.Lock()
defer ri.mu.Unlock()
// OK, parse data. // OK, parse data.
if _, err = ri.UnmarshalMsg(data[4:]); err != nil { if _, err = ri.UnmarshalMsg(data[4:]); err != nil {
return err return err
@ -439,8 +448,11 @@ func (ri *batchJobInfo) load(ctx context.Context, api ObjectLayer, job BatchJobR
return nil return nil
} }
func (ri batchJobInfo) clone() batchJobInfo { func (ri *batchJobInfo) clone() *batchJobInfo {
return batchJobInfo{ ri.mu.RLock()
defer ri.mu.RUnlock()
return &batchJobInfo{
Version: ri.Version, Version: ri.Version,
JobID: ri.JobID, JobID: ri.JobID,
JobType: ri.JobType, JobType: ri.JobType,
@ -458,21 +470,6 @@ func (ri batchJobInfo) clone() batchJobInfo {
} }
} }
func (ri batchJobInfo) save(ctx context.Context, api ObjectLayer, jobLocation string) error {
data := make([]byte, 4, ri.Msgsize()+4)
// Initialize the header.
binary.LittleEndian.PutUint16(data[0:2], batchReplFormat)
binary.LittleEndian.PutUint16(data[2:4], batchReplVersion)
buf, err := ri.MarshalMsg(data)
if err != nil {
return err
}
return saveConfig(ctx, api, pathJoin(jobLocation, batchReplName), buf)
}
func (ri *batchJobInfo) countItem(size int64, dmarker, success bool) { func (ri *batchJobInfo) countItem(size int64, dmarker, success bool) {
if ri == nil { if ri == nil {
return return
@ -499,14 +496,28 @@ func (ri *batchJobInfo) updateAfter(ctx context.Context, api ObjectLayer, durati
return errInvalidArgument return errInvalidArgument
} }
now := UTCNow() now := UTCNow()
ri.mu.Lock()
if now.Sub(ri.LastUpdate) >= duration { if now.Sub(ri.LastUpdate) >= duration {
if serverDebugLog { if serverDebugLog {
console.Debugf("batchReplicate: persisting batchReplication info on drive: threshold:%s, batchRepl:%#v\n", now.Sub(ri.LastUpdate), ri) console.Debugf("batchReplicate: persisting batchReplication info on drive: threshold:%s, batchRepl:%#v\n", now.Sub(ri.LastUpdate), ri)
} }
ri.LastUpdate = now ri.LastUpdate = now
ri.Version = batchReplVersionV1 ri.Version = batchReplVersionV1
return ri.save(ctx, api, jobLocation)
data := make([]byte, 4, ri.Msgsize()+4)
// Initialize the header.
binary.LittleEndian.PutUint16(data[0:2], batchReplFormat)
binary.LittleEndian.PutUint16(data[2:4], batchReplVersion)
buf, err := ri.MarshalMsg(data)
ri.mu.Unlock()
if err != nil {
return err
} }
return saveConfig(ctx, api, pathJoin(jobLocation, batchReplName), buf)
}
ri.mu.Unlock()
return nil return nil
} }
@ -514,6 +525,10 @@ func (ri *batchJobInfo) trackCurrentBucketObject(bucket string, info ObjectInfo,
if ri == nil { if ri == nil {
return return
} }
ri.mu.Lock()
defer ri.mu.Unlock()
ri.Bucket = bucket ri.Bucket = bucket
ri.Object = info.Name ri.Object = info.Name
ri.countItem(info.Size, info.DeleteMarker, failed) ri.countItem(info.Size, info.DeleteMarker, failed)
@ -529,7 +544,7 @@ func (r *BatchJobReplicateV1) Start(ctx context.Context, api ObjectLayer, job Ba
if err := ri.load(ctx, api, job); err != nil { if err := ri.load(ctx, api, job); err != nil {
return err return err
} }
globalBatchJobsMetrics.save(job.ID, ri.clone()) globalBatchJobsMetrics.save(job.ID, ri)
lastObject := ri.Object lastObject := ri.Object
delay := job.Replicate.Flags.Retry.Delay delay := job.Replicate.Flags.Retry.Delay
@ -619,9 +634,22 @@ func (r *BatchJobReplicateV1) Start(ctx context.Context, api ObjectLayer, job Ba
return err return err
} }
workerSize, err := strconv.Atoi(env.Get("_MINIO_BATCH_REPLICATION_WORKERS", strconv.Itoa(runtime.GOMAXPROCS(0)/2)))
if err != nil {
return err
}
retryAttempts := ri.RetryAttempts retryAttempts := ri.RetryAttempts
retry := false retry := false
for attempts := 1; attempts <= retryAttempts; attempts++ { for attempts := 1; attempts <= retryAttempts; attempts++ {
attempts := attempts
wk, err := workers.New(workerSize)
if err != nil {
// invalid worker size.
return err
}
ctx, cancel := context.WithCancel(ctx) ctx, cancel := context.WithCancel(ctx)
results := make(chan ObjectInfo, 100) results := make(chan ObjectInfo, 100)
@ -635,13 +663,18 @@ func (r *BatchJobReplicateV1) Start(ctx context.Context, api ObjectLayer, job Ba
} }
for result := range results { for result := range results {
result := result
wk.Take()
go func() {
defer wk.Give()
stopFn := globalBatchJobsMetrics.trace(batchReplicationMetricObject, job.ID, attempts, result) stopFn := globalBatchJobsMetrics.trace(batchReplicationMetricObject, job.ID, attempts, result)
success := true success := true
if err := r.ReplicateToTarget(ctx, api, c, result, retry); err != nil { if err := r.ReplicateToTarget(ctx, api, c, result, retry); err != nil {
if isErrVersionNotFound(err) || isErrObjectNotFound(err) { if isErrVersionNotFound(err) || isErrObjectNotFound(err) {
// object must be deleted concurrently, allow // object must be deleted concurrently, allow
// these failures but do not count them // these failures but do not count them
continue return
} }
stopFn(err) stopFn(err)
logger.LogIf(ctx, err) logger.LogIf(ctx, err)
@ -650,16 +683,20 @@ func (r *BatchJobReplicateV1) Start(ctx context.Context, api ObjectLayer, job Ba
stopFn(nil) stopFn(nil)
} }
ri.trackCurrentBucketObject(r.Source.Bucket, result, success) ri.trackCurrentBucketObject(r.Source.Bucket, result, success)
globalBatchJobsMetrics.save(job.ID, ri.clone()) globalBatchJobsMetrics.save(job.ID, ri)
// persist in-memory state to disk after every 10secs. // persist in-memory state to disk after every 10secs.
logger.LogIf(ctx, ri.updateAfter(ctx, api, 10*time.Second, job.Location)) logger.LogIf(ctx, ri.updateAfter(ctx, api, 10*time.Second, job.Location))
}()
} }
wk.Wait()
ri.RetryAttempts = attempts ri.RetryAttempts = attempts
ri.Complete = ri.ObjectsFailed == 0 ri.Complete = ri.ObjectsFailed == 0
ri.Failed = ri.ObjectsFailed > 0 ri.Failed = ri.ObjectsFailed > 0
globalBatchJobsMetrics.save(job.ID, ri.clone()) globalBatchJobsMetrics.save(job.ID, ri)
// persist in-memory state to disk.
logger.LogIf(ctx, ri.updateAfter(ctx, api, 0, job.Location))
buf, _ := json.Marshal(ri) buf, _ := json.Marshal(ri)
if err := r.Notify(ctx, bytes.NewReader(buf)); err != nil { if err := r.Notify(ctx, bytes.NewReader(buf)); err != nil {
@ -1135,11 +1172,11 @@ func (j *BatchJobPool) queueJob(req *BatchJobRequest) error {
//msgp:ignore batchJobMetrics //msgp:ignore batchJobMetrics
type batchJobMetrics struct { type batchJobMetrics struct {
sync.RWMutex sync.RWMutex
metrics map[string]batchJobInfo metrics map[string]*batchJobInfo
} }
var globalBatchJobsMetrics = batchJobMetrics{ var globalBatchJobsMetrics = batchJobMetrics{
metrics: make(map[string]batchJobInfo), metrics: make(map[string]*batchJobInfo),
} }
//msgp:ignore batchReplicationMetric //msgp:ignore batchReplicationMetric
@ -1207,11 +1244,11 @@ func (m *batchJobMetrics) delete(jobID string) {
delete(m.metrics, jobID) delete(m.metrics, jobID)
} }
func (m *batchJobMetrics) save(jobID string, ri batchJobInfo) { func (m *batchJobMetrics) save(jobID string, ri *batchJobInfo) {
m.Lock() m.Lock()
defer m.Unlock() defer m.Unlock()
m.metrics[jobID] = ri m.metrics[jobID] = ri.clone()
} }
func (m *batchJobMetrics) trace(d batchReplicationMetric, job string, attempts int, info ObjectInfo) func(err error) { func (m *batchJobMetrics) trace(d batchReplicationMetric, job string, attempts int, info ObjectInfo) func(err error) {

View File

@ -898,8 +898,9 @@ func (z *erasureServerPools) decommissionPool(ctx context.Context, idx int, pool
defer wg.Done() defer wg.Done()
err := set.listObjectsToDecommission(ctx, bi, err := set.listObjectsToDecommission(ctx, bi,
func(entry metaCacheEntry) { func(entry metaCacheEntry) {
parallelWorkers <- struct{}{} // Wait must be synchronized here.
wg.Add(1) wg.Add(1)
parallelWorkers <- struct{}{}
go decommissionEntry(entry) go decommissionEntry(entry)
}, },
) )

View File

@ -1,4 +1,4 @@
// Copyright (c) 2022 MinIO, Inc. // Copyright (c) 2022-2023 MinIO, Inc.
// //
// This file is part of MinIO Object Storage stack // This file is part of MinIO Object Storage stack
// //
@ -15,49 +15,49 @@
// You should have received a copy of the GNU Affero General Public License // You should have received a copy of the GNU Affero General Public License
// along with this program. If not, see <http://www.gnu.org/licenses/>. // along with this program. If not, see <http://www.gnu.org/licenses/>.
package jobtokens package workers
import ( import (
"errors" "errors"
"sync" "sync"
) )
// JobTokens provides a bounded semaphore with the ability to wait until all // Workers provides a bounded semaphore with the ability to wait until all
// concurrent jobs finish. // concurrent jobs finish.
type JobTokens struct { type Workers struct {
wg sync.WaitGroup wg sync.WaitGroup
tokens chan struct{} queue chan struct{}
} }
// New creates a JobTokens object which allows up to n jobs to proceed // New creates a Workers object which allows up to n jobs to proceed
// concurrently. n must be > 0. // concurrently. n must be > 0.
func New(n int) (*JobTokens, error) { func New(n int) (*Workers, error) {
if n <= 0 { if n <= 0 {
return nil, errors.New("n must be > 0") return nil, errors.New("n must be > 0")
} }
tokens := make(chan struct{}, n) queue := make(chan struct{}, n)
for i := 0; i < n; i++ { for i := 0; i < n; i++ {
tokens <- struct{}{} queue <- struct{}{}
} }
return &JobTokens{ return &Workers{
tokens: tokens, queue: queue,
}, nil }, nil
} }
// Take is how a job (goroutine) can Take its turn. // Take is how a job (goroutine) can Take its turn.
func (jt *JobTokens) Take() { func (jt *Workers) Take() {
jt.wg.Add(1) jt.wg.Add(1)
<-jt.tokens <-jt.queue
} }
// Give is how a job (goroutine) can give back its turn once done. // Give is how a job (goroutine) can give back its turn once done.
func (jt *JobTokens) Give() { func (jt *Workers) Give() {
jt.queue <- struct{}{}
jt.wg.Done() jt.wg.Done()
jt.tokens <- struct{}{}
} }
// Wait waits for all ongoing concurrent jobs to complete // Wait waits for all ongoing concurrent jobs to complete
func (jt *JobTokens) Wait() { func (jt *Workers) Wait() {
jt.wg.Wait() jt.wg.Wait()
} }

View File

@ -1,4 +1,4 @@
// Copyright (c) 2022 MinIO, Inc. // Copyright (c) 2022-2023 MinIO, Inc.
// //
// This file is part of MinIO Object Storage stack // This file is part of MinIO Object Storage stack
// //
@ -15,7 +15,7 @@
// You should have received a copy of the GNU Affero General Public License // You should have received a copy of the GNU Affero General Public License
// along with this program. If not, see <http://www.gnu.org/licenses/>. // along with this program. If not, see <http://www.gnu.org/licenses/>.
package jobtokens package workers
import ( import (
"fmt" "fmt"
@ -23,7 +23,7 @@ import (
"testing" "testing"
) )
func TestJobTokens(t *testing.T) { func TestWorkers(t *testing.T) {
tests := []struct { tests := []struct {
n int n int
jobs int jobs int
@ -59,7 +59,7 @@ func TestJobTokens(t *testing.T) {
testFn := func(n, jobs int, mustFail bool) { testFn := func(n, jobs int, mustFail bool) {
var mu sync.Mutex var mu sync.Mutex
var jobsDone int var jobsDone int
// Create jobTokens for n concurrent workers // Create workers for n concurrent workers
jt, err := New(n) jt, err := New(n)
if err == nil && mustFail { if err == nil && mustFail {
t.Fatal("Expected test to return error") t.Fatal("Expected test to return error")
@ -92,8 +92,8 @@ func TestJobTokens(t *testing.T) {
}) })
} }
// Verify that jobTokens can be reused after full drain // Verify that workers can be reused after full drain
t.Run("test-jobTokens-reuse", func(t *testing.T) { t.Run("test-workers-reuse", func(t *testing.T) {
var mu sync.Mutex var mu sync.Mutex
jt, _ := New(5) jt, _ := New(5)
for reuse := 0; reuse < 3; reuse++ { for reuse := 0; reuse < 3; reuse++ {
@ -115,7 +115,7 @@ func TestJobTokens(t *testing.T) {
}) })
} }
func benchmarkJobTokens(b *testing.B, n, jobs int) { func benchmarkWorkers(b *testing.B, n, jobs int) {
b.ReportAllocs() b.ReportAllocs()
b.RunParallel(func(pb *testing.PB) { b.RunParallel(func(pb *testing.PB) {
for pb.Next() { for pb.Next() {
@ -139,10 +139,10 @@ func benchmarkJobTokens(b *testing.B, n, jobs int) {
}) })
} }
func BenchmarkJobTokens_N5_J10(b *testing.B) { func BenchmarkWorkers_N5_J10(b *testing.B) {
benchmarkJobTokens(b, 5, 10) benchmarkWorkers(b, 5, 10)
} }
func BenchmarkJobTokens_N5_J100(b *testing.B) { func BenchmarkWorkers_N5_J100(b *testing.B) {
benchmarkJobTokens(b, 5, 100) benchmarkWorkers(b, 5, 100)
} }