Add Audit target metrics (#16044)

2025-11-08 21:24:55 -05:00 · 2022-11-10 19:20:21 +01:00
parent 34d28dd79f
commit 5b242f1d11
8 changed files with 233 additions and 32 deletions
--- a/internal/logger/target/http/http.go
+++ b/internal/logger/target/http/http.go
@@ -26,14 +26,20 @@ import (
 	"net/http"
 	"strings"
 	"sync"
+	"sync/atomic"
 	"time"

 	xhttp "github.com/minio/minio/internal/http"
 	"github.com/minio/minio/internal/logger/target/types"
 )

-// Timeout for the webhook http call
-const webhookCallTimeout = 5 * time.Second
+const (
+	// Timeout for the webhook http call
+	webhookCallTimeout = 5 * time.Second
+
+	// maxWorkers is the maximum number of concurrent operations.
+	maxWorkers = 8
+)

 // Config http logger target
 type Config struct {
@@ -57,6 +63,14 @@ type Config struct {
 // buffer is full, new logs are just ignored and an error
 // is returned to the caller.
 type Target struct {
+	totalMessages  int64
+	failedMessages int64
+
+	// Worker control
+	workers       int64
+	workerStartMu sync.Mutex
+	lastStarted   time.Time
+
 	wg     sync.WaitGroup
 	doneCh chan struct{}

@@ -64,6 +78,7 @@ type Target struct {
 	logCh chan interface{}

 	config Config
+	client *http.Client
 }

 // Endpoint returns the backend endpoint
@@ -75,6 +90,15 @@ func (h *Target) String() string {
 	return h.config.Name
 }

+// Stats returns the target statistics.
+func (h *Target) Stats() types.TargetStats {
+	return types.TargetStats{
+		TotalMessages:  atomic.LoadInt64(&h.totalMessages),
+		FailedMessages: atomic.LoadInt64(&h.failedMessages),
+		QueueLength:    len(h.logCh),
+	}
+}
+
 // Init validate and initialize the http target
 func (h *Target) Init() error {
 	ctx, cancel := context.WithTimeout(context.Background(), 2*webhookCallTimeout)
@@ -100,6 +124,7 @@ func (h *Target) Init() error {
 	if err != nil {
 		return err
 	}
+	h.client = &client

 	// Drain any response.
 	xhttp.DrainBody(resp.Body)
@@ -114,6 +139,8 @@ func (h *Target) Init() error {
 			h.config.Endpoint, resp.Status)
 	}

+	h.lastStarted = time.Now()
+	atomic.AddInt64(&h.workers, 1)
 	go h.startHTTPLogger()
 	return nil
 }
@@ -128,15 +155,17 @@ func acceptedResponseStatusCode(code int) bool {
 func (h *Target) logEntry(entry interface{}) {
 	logJSON, err := json.Marshal(&entry)
 	if err != nil {
+		atomic.AddInt64(&h.failedMessages, 1)
 		return
 	}

 	ctx, cancel := context.WithTimeout(context.Background(), webhookCallTimeout)
+	defer cancel()
 	req, err := http.NewRequestWithContext(ctx, http.MethodPost,
 		h.config.Endpoint, bytes.NewReader(logJSON))
 	if err != nil {
 		h.config.LogOnce(ctx, fmt.Errorf("%s returned '%w', please check your endpoint configuration", h.config.Endpoint, err), h.config.Endpoint)
-		cancel()
+		atomic.AddInt64(&h.failedMessages, 1)
 		return
 	}
 	req.Header.Set(xhttp.ContentType, "application/json")
@@ -151,10 +180,9 @@ func (h *Target) logEntry(entry interface{}) {
 		req.Header.Set("Authorization", h.config.AuthToken)
 	}

-	client := http.Client{Transport: h.config.Transport}
-	resp, err := client.Do(req)
-	cancel()
+	resp, err := h.client.Do(req)
 	if err != nil {
+		atomic.AddInt64(&h.failedMessages, 1)
 		h.config.LogOnce(ctx, fmt.Errorf("%s returned '%w', please check your endpoint configuration", h.config.Endpoint, err), h.config.Endpoint)
 		return
 	}
@@ -163,6 +191,7 @@ func (h *Target) logEntry(entry interface{}) {
 	xhttp.DrainBody(resp.Body)

 	if !acceptedResponseStatusCode(resp.StatusCode) {
+		atomic.AddInt64(&h.failedMessages, 1)
 		switch resp.StatusCode {
 		case http.StatusForbidden:
 			h.config.LogOnce(ctx, fmt.Errorf("%s returned '%s', please check if your auth token is correctly set", h.config.Endpoint, resp.Status), h.config.Endpoint)
@@ -177,11 +206,15 @@ func (h *Target) startHTTPLogger() {
 	// from an internal channel.
 	h.wg.Add(1)
 	go func() {
-		defer h.wg.Done()
+		defer func() {
+			h.wg.Done()
+			atomic.AddInt64(&h.workers, -1)
+		}()

 		for {
 			select {
 			case entry := <-h.logCh:
+				atomic.AddInt64(&h.totalMessages, 1)
 				h.logEntry(entry)
 			case <-h.doneCh:
 				return
@@ -214,8 +247,30 @@ func (h *Target) Send(entry interface{}) error {
 	case <-h.doneCh:
 	case h.logCh <- entry:
 	default:
+		nWorkers := atomic.LoadInt64(&h.workers)
+		if nWorkers < maxWorkers {
+			// Only have one try to start at the same time.
+			h.workerStartMu.Lock()
+			defer h.workerStartMu.Unlock()
+			// Start one max every second.
+			if time.Since(h.lastStarted) > time.Second {
+				if atomic.CompareAndSwapInt64(&h.workers, nWorkers, nWorkers+1) {
+					// Start another logger.
+					h.lastStarted = time.Now()
+					go h.startHTTPLogger()
+				}
+			}
+			// Block to send
+			select {
+			case <-h.doneCh:
+			case h.logCh <- entry:
+			}
+			return nil
+		}
 		// log channel is full, do not wait and return
 		// an error immediately to the caller
+		atomic.AddInt64(&h.totalMessages, 1)
+		atomic.AddInt64(&h.failedMessages, 1)
 		return errors.New("log buffer full")
 	}

--- a/internal/logger/target/kafka/kafka.go
+++ b/internal/logger/target/kafka/kafka.go
@@ -25,6 +25,7 @@ import (
 	"errors"
 	"net"
 	"sync"
+	"sync/atomic"

 	"github.com/Shopify/sarama"
 	saramatls "github.com/Shopify/sarama/tools/tls"
@@ -36,11 +37,14 @@ import (

 // Target - Kafka target.
 type Target struct {
+	totalMessages  int64
+	failedMessages int64
+
 	wg     sync.WaitGroup
 	doneCh chan struct{}

 	// Channel of log entries
-	logCh chan interface{}
+	logCh chan audit.Entry

 	producer sarama.SyncProducer
 	kconfig  Config
@@ -55,37 +59,40 @@ func (h *Target) Send(entry interface{}) error {
 	default:
 	}

-	select {
-	case <-h.doneCh:
-	case h.logCh <- entry:
-	default:
-		// log channel is full, do not wait and return
-		// an error immediately to the caller
-		return errors.New("log buffer full")
+	if e, ok := entry.(audit.Entry); ok {
+		select {
+		case <-h.doneCh:
+		case h.logCh <- e:
+		default:
+			// log channel is full, do not wait and return
+			// an error immediately to the caller
+			atomic.AddInt64(&h.totalMessages, 1)
+			atomic.AddInt64(&h.failedMessages, 1)
+			return errors.New("log buffer full")
+		}
 	}

 	return nil
 }

-func (h *Target) logEntry(entry interface{}) {
+func (h *Target) logEntry(entry audit.Entry) {
+	atomic.AddInt64(&h.totalMessages, 1)
 	logJSON, err := json.Marshal(&entry)
 	if err != nil {
+		atomic.AddInt64(&h.failedMessages, 1)
 		return
 	}
+	msg := sarama.ProducerMessage{
+		Topic: h.kconfig.Topic,
+		Key:   sarama.StringEncoder(entry.RequestID),
+		Value: sarama.ByteEncoder(logJSON),
+	}

-	ae, ok := entry.(audit.Entry)
-	if ok {
-		msg := sarama.ProducerMessage{
-			Topic: h.kconfig.Topic,
-			Key:   sarama.StringEncoder(ae.RequestID),
-			Value: sarama.ByteEncoder(logJSON),
-		}
-
-		_, _, err = h.producer.SendMessage(&msg)
-		if err != nil {
-			h.kconfig.LogOnce(context.Background(), err, h.kconfig.Topic)
-			return
-		}
+	_, _, err = h.producer.SendMessage(&msg)
+	if err != nil {
+		atomic.AddInt64(&h.failedMessages, 1)
+		h.kconfig.LogOnce(context.Background(), err, h.kconfig.Topic)
+		return
 	}
 }

@@ -147,6 +154,15 @@ func (k Config) pingBrokers() error {
 	return err
 }

+// Stats returns the target statistics.
+func (h *Target) Stats() types.TargetStats {
+	return types.TargetStats{
+		TotalMessages:  atomic.LoadInt64(&h.totalMessages),
+		FailedMessages: atomic.LoadInt64(&h.failedMessages),
+		QueueLength:    len(h.logCh),
+	}
+}
+
 // Endpoint - return kafka target
 func (h *Target) Endpoint() string {
 	return "kafka"
@@ -231,7 +247,7 @@ func (h *Target) Cancel() {
 // sends log over http to the specified endpoint
 func New(config Config) *Target {
 	target := &Target{
-		logCh:   make(chan interface{}, 10000),
+		logCh:   make(chan audit.Entry, 10000),
 		doneCh:  make(chan struct{}),
 		kconfig: config,
 	}
--- a/internal/logger/target/types/targettype_string.go
+++ b/internal/logger/target/types/targettype_string.go
@@ -0,0 +1,26 @@
+// Code generated by "stringer -type=TargetType -trimprefix=Target types.go"; DO NOT EDIT.
+
+package types
+
+import "strconv"
+
+func _() {
+	// An "invalid array index" compiler error signifies that the constant values have changed.
+	// Re-run the stringer command to generate them again.
+	var x [1]struct{}
+	_ = x[TargetConsole-1]
+	_ = x[TargetHTTP-2]
+	_ = x[TargetKafka-3]
+}
+
+const _TargetType_name = "ConsoleHTTPKafka"
+
+var _TargetType_index = [...]uint8{0, 7, 11, 16}
+
+func (i TargetType) String() string {
+	i -= 1
+	if i >= TargetType(len(_TargetType_index)-1) {
+		return "TargetType(" + strconv.FormatInt(int64(i+1), 10) + ")"
+	}
+	return _TargetType_name[_TargetType_index[i]:_TargetType_index[i+1]]
+}
--- a/internal/logger/target/types/types.go
+++ b/internal/logger/target/types/types.go
@@ -20,6 +20,8 @@ package types
 // TargetType indicates type of the target e.g. console, http, kafka
 type TargetType uint8

+//go:generate stringer -type=TargetType -trimprefix=Target $GOFILE
+
 // Constants for target types
 const (
 	_ TargetType = iota
@@ -27,3 +29,15 @@ const (
 	TargetHTTP
 	TargetKafka
 )
+
+// TargetStats contains statistics for a target.
+type TargetStats struct {
+	// QueueLength is the queue length if any messages are queued.
+	QueueLength int
+
+	// TotalMessages is the total number of messages sent in the lifetime of the target
+	TotalMessages int64
+
+	// FailedMessages should log message count that failed to send.
+	FailedMessages int64
+}