fix: simplify passing auditLog eventType (#15278)

Rename Trigger -> Event to be a more appropriate
name for the audit event.

Bonus: fixes a bug in AddMRFWorker() it did not
cancel the waitgroup, leading to waitgroup leaks.
This commit is contained in:
Harshavardhana 2022-07-12 10:43:32 -07:00 committed by GitHub
parent b4eb74f5ff
commit 0a8b78cb84
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
8 changed files with 56 additions and 36 deletions

View File

@ -649,6 +649,7 @@ func (api objectAPIHandlers) DeleteMultipleObjectsHandler(w http.ResponseWriter,
dv := DeletedObjectReplicationInfo{ dv := DeletedObjectReplicationInfo{
DeletedObject: dobj, DeletedObject: dobj,
Bucket: bucket, Bucket: bucket,
EventType: ReplicateIncomingDelete,
} }
scheduleReplicationDelete(ctx, dv, objectAPI) scheduleReplicationDelete(ctx, dv, objectAPI)
} }

View File

@ -347,7 +347,7 @@ func checkReplicateDelete(ctx context.Context, bucket string, dobj ObjectToDelet
// target cluster, the object version is marked deleted on the source and hidden from listing. It is permanently // target cluster, the object version is marked deleted on the source and hidden from listing. It is permanently
// deleted from the source when the VersionPurgeStatus changes to "Complete", i.e after replication succeeds // deleted from the source when the VersionPurgeStatus changes to "Complete", i.e after replication succeeds
// on target. // on target.
func replicateDelete(ctx context.Context, dobj DeletedObjectReplicationInfo, objectAPI ObjectLayer, trigger string) { func replicateDelete(ctx context.Context, dobj DeletedObjectReplicationInfo, objectAPI ObjectLayer) {
var replicationStatus replication.StatusType var replicationStatus replication.StatusType
bucket := dobj.Bucket bucket := dobj.Bucket
versionID := dobj.DeleteMarkerVersionID versionID := dobj.DeleteMarkerVersionID
@ -358,7 +358,7 @@ func replicateDelete(ctx context.Context, dobj DeletedObjectReplicationInfo, obj
defer func() { defer func() {
replStatus := string(replicationStatus) replStatus := string(replicationStatus)
auditLogInternal(context.Background(), bucket, dobj.ObjectName, AuditLogOptions{ auditLogInternal(context.Background(), bucket, dobj.ObjectName, AuditLogOptions{
Trigger: trigger, Event: dobj.EventType,
APIName: ReplicateDeleteAPI, APIName: ReplicateDeleteAPI,
VersionID: versionID, VersionID: versionID,
Status: replStatus, Status: replStatus,
@ -857,7 +857,7 @@ func getReplicationAction(oi1 ObjectInfo, oi2 minio.ObjectInfo, opType replicati
// replicateObject replicates the specified version of the object to destination bucket // replicateObject replicates the specified version of the object to destination bucket
// The source object is then updated to reflect the replication status. // The source object is then updated to reflect the replication status.
func replicateObject(ctx context.Context, ri ReplicateObjectInfo, objectAPI ObjectLayer, trigger string) { func replicateObject(ctx context.Context, ri ReplicateObjectInfo, objectAPI ObjectLayer) {
var replicationStatus replication.StatusType var replicationStatus replication.StatusType
defer func() { defer func() {
if replicationStatus.Empty() { if replicationStatus.Empty() {
@ -868,7 +868,7 @@ func replicateObject(ctx context.Context, ri ReplicateObjectInfo, objectAPI Obje
replicationStatus = ri.ReplicationStatus replicationStatus = ri.ReplicationStatus
} }
auditLogInternal(ctx, ri.Bucket, ri.Name, AuditLogOptions{ auditLogInternal(ctx, ri.Bucket, ri.Name, AuditLogOptions{
Trigger: trigger, Event: ri.EventType,
APIName: ReplicateObjectAPI, APIName: ReplicateObjectAPI,
VersionID: ri.VersionID, VersionID: ri.VersionID,
Status: replicationStatus.String(), Status: replicationStatus.String(),
@ -990,6 +990,7 @@ func replicateObject(ctx context.Context, ri ReplicateObjectInfo, objectAPI Obje
// the target site is down. Leave it to scanner to catch up instead. // the target site is down. Leave it to scanner to catch up instead.
if rinfos.ReplicationStatus() != replication.Completed && ri.RetryCount < 1 { if rinfos.ReplicationStatus() != replication.Completed && ri.RetryCount < 1 {
ri.OpType = replication.HealReplicationType ri.OpType = replication.HealReplicationType
ri.EventType = ReplicateMRF
ri.ReplicationStatusInternal = rinfos.ReplicationStatusInternal() ri.ReplicationStatusInternal = rinfos.ReplicationStatusInternal()
ri.RetryCount++ ri.RetryCount++
globalReplicationPool.queueReplicaFailedTask(ri) globalReplicationPool.queueReplicaFailedTask(ri)
@ -1291,6 +1292,7 @@ func filterReplicationStatusMetadata(metadata map[string]string) map[string]stri
type DeletedObjectReplicationInfo struct { type DeletedObjectReplicationInfo struct {
DeletedObject DeletedObject
Bucket string Bucket string
EventType string
OpType replication.Type OpType replication.Type
ResetID string ResetID string
TargetArn string TargetArn string
@ -1313,12 +1315,15 @@ const (
// ReplicateMRF - audit trail for replication from Most Recent Failures (MRF) queue // ReplicateMRF - audit trail for replication from Most Recent Failures (MRF) queue
ReplicateMRF = "replicate:mrf" ReplicateMRF = "replicate:mrf"
// ReplicateIncoming - audit trail indicating replication started [could be from incoming/existing/heal activity] // ReplicateIncoming - audit trail of inline replication
ReplicateIncoming = "replicate:incoming" ReplicateIncoming = "replicate:incoming"
// ReplicateIncomingDelete - audit trail of inline replication of deletes.
ReplicateIncomingDelete = "replicate:incoming:delete"
// ReplicateHeal - audit trail for healing of failed/pending replications // ReplicateHeal - audit trail for healing of failed/pending replications
ReplicateHeal = "replicate:heal" ReplicateHeal = "replicate:heal"
// ReplicateDelete - audit trail for delete replication // ReplicateHealDelete - audit trail of healing of failed/pending delete replications.
ReplicateDelete = "replicate:delete" ReplicateHealDelete = "replicate:heal:delete"
) )
var ( var (
@ -1364,13 +1369,14 @@ func NewReplicationPool(ctx context.Context, o ObjectLayer, opts replicationPool
pool.ResizeWorkers(opts.Workers) pool.ResizeWorkers(opts.Workers)
pool.ResizeFailedWorkers(opts.FailedWorkers) pool.ResizeFailedWorkers(opts.FailedWorkers)
go pool.AddExistingObjectReplicateWorker() go pool.AddExistingObjectReplicateWorker()
go pool.periodicResyncMetaSave(ctx, o) go pool.updateResyncStatus(ctx, o)
return pool return pool
} }
// AddMRFWorker adds a pending/failed replication worker to handle requests that could not be queued // AddMRFWorker adds a pending/failed replication worker to handle requests that could not be queued
// to the other workers // to the other workers
func (p *ReplicationPool) AddMRFWorker() { func (p *ReplicationPool) AddMRFWorker() {
defer p.mrfWorkerWg.Done()
for { for {
select { select {
case <-p.ctx.Done(): case <-p.ctx.Done():
@ -1379,7 +1385,7 @@ func (p *ReplicationPool) AddMRFWorker() {
if !ok { if !ok {
return return
} }
replicateObject(p.ctx, oi, p.objLayer, ReplicateMRF) replicateObject(p.ctx, oi, p.objLayer)
case <-p.mrfWorkerKillCh: case <-p.mrfWorkerKillCh:
return return
} }
@ -1397,12 +1403,12 @@ func (p *ReplicationPool) AddWorker() {
if !ok { if !ok {
return return
} }
replicateObject(p.ctx, oi, p.objLayer, ReplicateIncoming) replicateObject(p.ctx, oi, p.objLayer)
case doi, ok := <-p.replicaDeleteCh: case doi, ok := <-p.replicaDeleteCh:
if !ok { if !ok {
return return
} }
replicateDelete(p.ctx, doi, p.objLayer, ReplicateDelete) replicateDelete(p.ctx, doi, p.objLayer)
case <-p.workerKillCh: case <-p.workerKillCh:
return return
} }
@ -1419,12 +1425,12 @@ func (p *ReplicationPool) AddExistingObjectReplicateWorker() {
if !ok { if !ok {
return return
} }
replicateObject(p.ctx, oi, p.objLayer, ReplicateExisting) replicateObject(p.ctx, oi, p.objLayer)
case doi, ok := <-p.existingReplicaDeleteCh: case doi, ok := <-p.existingReplicaDeleteCh:
if !ok { if !ok {
return return
} }
replicateDelete(p.ctx, doi, p.objLayer, ReplicateExistingDelete) replicateDelete(p.ctx, doi, p.objLayer)
} }
} }
} }
@ -1482,7 +1488,7 @@ func (p *ReplicationPool) queueReplicaFailedTask(ri ReplicateObjectInfo) {
}) })
case p.mrfReplicaCh <- ri: case p.mrfReplicaCh <- ri:
default: default:
logger.LogOnceIf(GlobalContext, fmt.Errorf("WARNING: Replication failed workers could not keep up with healing failures - consider increasing number of replication failed workers with `mc admin config set api replication_failed_workers=%d`", p.suggestedWorkers(true)), replicationSubsystem) logger.LogOnceIf(GlobalContext, fmt.Errorf("WARNING: Unable to keep up retrying failed replication - we recommend increasing number of replication failed workers with `mc admin config set api replication_failed_workers=%d`", p.suggestedWorkers(true)), replicationSubsystem)
} }
} }
@ -1508,7 +1514,7 @@ func (p *ReplicationPool) queueReplicaTask(ri ReplicateObjectInfo) {
}) })
case ch <- ri: case ch <- ri:
default: default:
logger.LogOnceIf(GlobalContext, fmt.Errorf("WARNING: Replication workers could not keep up with incoming traffic - consider increasing number of replication workers with `mc admin config set api replication_workers=%d`", p.suggestedWorkers(false)), replicationSubsystem) logger.LogOnceIf(GlobalContext, fmt.Errorf("WARNING: Unable to keep up with incoming traffic - we recommend increasing number of replicate object workers with `mc admin config set api replication_workers=%d`", p.suggestedWorkers(false)), replicationSubsystem)
} }
} }
@ -1545,7 +1551,7 @@ func (p *ReplicationPool) queueReplicaDeleteTask(doi DeletedObjectReplicationInf
}) })
case ch <- doi: case ch <- doi:
default: default:
logger.LogOnceIf(GlobalContext, fmt.Errorf("WARNING: Replication workers could not keep up with incoming traffic - consider increasing number of replication workers with `mc admin config set api replication_workers=%d`", p.suggestedWorkers(false)), replicationSubsystem) logger.LogOnceIf(GlobalContext, fmt.Errorf("WARNING: Unable to keep up with incoming deletes - we recommend increasing number of replicate workers with `mc admin config set api replication_workers=%d`", p.suggestedWorkers(false)), replicationSubsystem)
} }
} }
@ -1722,10 +1728,11 @@ func proxyHeadToReplicationTarget(ctx context.Context, bucket, object string, rs
} }
func scheduleReplication(ctx context.Context, objInfo ObjectInfo, o ObjectLayer, dsc ReplicateDecision, opType replication.Type) { func scheduleReplication(ctx context.Context, objInfo ObjectInfo, o ObjectLayer, dsc ReplicateDecision, opType replication.Type) {
ri := ReplicateObjectInfo{ObjectInfo: objInfo, OpType: opType, Dsc: dsc, EventType: ReplicateIncoming}
if dsc.Synchronous() { if dsc.Synchronous() {
replicateObject(ctx, ReplicateObjectInfo{ObjectInfo: objInfo, OpType: opType, Dsc: dsc}, o, ReplicateIncoming) replicateObject(ctx, ri, o)
} else { } else {
globalReplicationPool.queueReplicaTask(ReplicateObjectInfo{ObjectInfo: objInfo, OpType: opType, Dsc: dsc}) globalReplicationPool.queueReplicaTask(ri)
} }
if sz, err := objInfo.GetActualSize(); err == nil { if sz, err := objInfo.GetActualSize(); err == nil {
for arn := range dsc.targetsMap { for arn := range dsc.targetsMap {
@ -1956,10 +1963,10 @@ func getLatestReplicationStats(bucket string, u BucketUsageInfo) (s BucketReplic
return calculateBucketReplicationStats(bucket, u, bucketStats) return calculateBucketReplicationStats(bucket, u, bucketStats)
} }
const resyncTimeInterval = time.Minute * 10 const resyncTimeInterval = time.Minute * 1
// periodicResyncMetaSave saves in-memory resync meta stats to disk in periodic intervals // updateResyncStatus persists in-memory resync metadata stats to disk at periodic intervals
func (p *ReplicationPool) periodicResyncMetaSave(ctx context.Context, objectAPI ObjectLayer) { func (p *ReplicationPool) updateResyncStatus(ctx context.Context, objectAPI ObjectLayer) {
resyncTimer := time.NewTimer(resyncTimeInterval) resyncTimer := time.NewTimer(resyncTimeInterval)
defer resyncTimer.Stop() defer resyncTimer.Stop()
@ -2085,13 +2092,15 @@ func resyncBucket(ctx context.Context, bucket, arn string, heal bool, objectAPI
DeleteMarkerMTime: DeleteMarkerMTime{roi.ModTime}, DeleteMarkerMTime: DeleteMarkerMTime{roi.ModTime},
DeleteMarker: roi.DeleteMarker, DeleteMarker: roi.DeleteMarker,
}, },
Bucket: roi.Bucket, Bucket: roi.Bucket,
OpType: replication.ExistingObjectReplicationType, OpType: replication.ExistingObjectReplicationType,
EventType: ReplicateExistingDelete,
} }
replicateDelete(ctx, doi, objectAPI, ReplicateDelete) replicateDelete(ctx, doi, objectAPI)
} else { } else {
roi.OpType = replication.ExistingObjectReplicationType roi.OpType = replication.ExistingObjectReplicationType
replicateObject(ctx, roi, objectAPI, ReplicateExisting) roi.EventType = ReplicateExisting
replicateObject(ctx, roi, objectAPI)
} }
_, err = tgt.StatObject(ctx, tgt.Bucket, roi.Name, miniogo.StatObjectOptions{ _, err = tgt.StatObject(ctx, tgt.Bucket, roi.Name, miniogo.StatObjectOptions{
VersionID: roi.VersionID, VersionID: roi.VersionID,

View File

@ -1278,12 +1278,14 @@ func (i *scannerItem) healReplication(ctx context.Context, o ObjectLayer, oi Obj
switch oi.ReplicationStatus { switch oi.ReplicationStatus {
case replication.Pending, replication.Failed: case replication.Pending, replication.Failed:
roi.EventType = ReplicateHeal
globalReplicationPool.queueReplicaTask(roi) globalReplicationPool.queueReplicaTask(roi)
return return
case replication.Replica: case replication.Replica:
sizeS.replicaSize += oi.Size sizeS.replicaSize += oi.Size
} }
if roi.ExistingObjResync.mustResync() { if roi.ExistingObjResync.mustResync() {
roi.EventType = ReplicateExisting
globalReplicationPool.queueReplicaTask(roi) globalReplicationPool.queueReplicaTask(roi)
} }
} }
@ -1309,11 +1311,13 @@ func (i *scannerItem) healReplicationDeletes(ctx context.Context, o ObjectLayer,
DeleteMarkerMTime: DeleteMarkerMTime{roi.ModTime}, DeleteMarkerMTime: DeleteMarkerMTime{roi.ModTime},
DeleteMarker: roi.DeleteMarker, DeleteMarker: roi.DeleteMarker,
}, },
Bucket: roi.Bucket, Bucket: roi.Bucket,
OpType: replication.HealReplicationType, OpType: replication.HealReplicationType,
EventType: ReplicateHealDelete,
} }
if roi.ExistingObjResync.mustResync() { if roi.ExistingObjResync.mustResync() {
doi.OpType = replication.ExistingObjectReplicationType doi.OpType = replication.ExistingObjectReplicationType
doi.EventType = ReplicateExistingDelete
queueReplicateDeletesWrapper(doi, roi.ExistingObjResync) queueReplicateDeletesWrapper(doi, roi.ExistingObjResync)
return return
} }
@ -1476,9 +1480,9 @@ const (
ILMTransition = " ilm:transition" ILMTransition = " ilm:transition"
) )
func auditLogLifecycle(ctx context.Context, oi ObjectInfo, trigger string) { func auditLogLifecycle(ctx context.Context, oi ObjectInfo, event string) {
var apiName string var apiName string
switch trigger { switch event {
case ILMExpiry: case ILMExpiry:
apiName = "ILMExpiry" apiName = "ILMExpiry"
case ILMFreeVersionDelete: case ILMFreeVersionDelete:
@ -1487,7 +1491,7 @@ func auditLogLifecycle(ctx context.Context, oi ObjectInfo, trigger string) {
apiName = "ILMTransition" apiName = "ILMTransition"
} }
auditLogInternal(ctx, oi.Bucket, oi.Name, AuditLogOptions{ auditLogInternal(ctx, oi.Bucket, oi.Name, AuditLogOptions{
Trigger: trigger, Event: event,
APIName: apiName, APIName: apiName,
VersionID: oi.VersionID, VersionID: oi.VersionID,
}) })

View File

@ -1151,7 +1151,7 @@ func auditLogDecom(ctx context.Context, apiName, bucket, object, versionID strin
errStr = err.Error() errStr = err.Error()
} }
auditLogInternal(ctx, bucket, object, AuditLogOptions{ auditLogInternal(ctx, bucket, object, AuditLogOptions{
Trigger: "decommissioning", Event: "decommission",
APIName: apiName, APIName: apiName,
VersionID: versionID, VersionID: versionID,
Error: errStr, Error: errStr,

View File

@ -262,6 +262,7 @@ func (o ObjectInfo) tierStats() tierStats {
type ReplicateObjectInfo struct { type ReplicateObjectInfo struct {
ObjectInfo ObjectInfo
OpType replication.Type OpType replication.Type
EventType string
RetryCount uint32 RetryCount uint32
ResetID string ResetID string
Dsc ReplicateDecision Dsc ReplicateDecision

View File

@ -3567,7 +3567,8 @@ func (api objectAPIHandlers) DeleteObjectHandler(w http.ResponseWriter, r *http.
DeleteMarker: objInfo.DeleteMarker, DeleteMarker: objInfo.DeleteMarker,
ReplicationState: objInfo.getReplicationState(dsc.String(), opts.VersionID, false), ReplicationState: objInfo.getReplicationState(dsc.String(), opts.VersionID, false),
}, },
Bucket: bucket, Bucket: bucket,
EventType: ReplicateIncomingDelete,
} }
scheduleReplicationDelete(ctx, dobj, objectAPI) scheduleReplicationDelete(ctx, dobj, objectAPI)
} }

View File

@ -1036,7 +1036,7 @@ func totalNodeCount() uint64 {
// AuditLogOptions takes options for audit logging subsystem activity // AuditLogOptions takes options for audit logging subsystem activity
type AuditLogOptions struct { type AuditLogOptions struct {
Trigger string Event string
APIName string APIName string
Status string Status string
VersionID string VersionID string
@ -1046,7 +1046,8 @@ type AuditLogOptions struct {
// sends audit logs for internal subsystem activity // sends audit logs for internal subsystem activity
func auditLogInternal(ctx context.Context, bucket, object string, opts AuditLogOptions) { func auditLogInternal(ctx context.Context, bucket, object string, opts AuditLogOptions) {
entry := audit.NewEntry(globalDeploymentID) entry := audit.NewEntry(globalDeploymentID)
entry.Trigger = opts.Trigger entry.Trigger = opts.Event
entry.Event = opts.Event
entry.Error = opts.Error entry.Error = opts.Error
entry.API.Name = opts.APIName entry.API.Name = opts.APIName
entry.API.Bucket = bucket entry.API.Bucket = bucket

View File

@ -40,8 +40,11 @@ type Entry struct {
Version string `json:"version"` Version string `json:"version"`
DeploymentID string `json:"deploymentid,omitempty"` DeploymentID string `json:"deploymentid,omitempty"`
Time time.Time `json:"time"` Time time.Time `json:"time"`
Trigger string `json:"trigger"` Event string `json:"event"`
API struct { // deprecated replaced by 'Event', kept here for some
// time for backward compatibility with k8s Operator.
Trigger string `json:"trigger"`
API struct {
Name string `json:"name,omitempty"` Name string `json:"name,omitempty"`
Bucket string `json:"bucket,omitempty"` Bucket string `json:"bucket,omitempty"`
Object string `json:"object,omitempty"` Object string `json:"object,omitempty"`