
fix: use compressed event size to close chunk #7517

Open · wants to merge 5 commits into main (base: main) · Showing changes from 3 commits
v1/plugins/logs/encoder.go (30 changes: 23 additions & 7 deletions)
@@ -28,14 +28,18 @@ const (
 // written to the encoder and the encoder outputs chunks that are fit to the
 // configured limit.
 type chunkEncoder struct {
-	limit        int64
-	bytesWritten int
-	buf          *bytes.Buffer
-	w            *gzip.Writer
-	metrics      metrics.Metrics
+	limit int64
+
+	// The soft limit is a dynamic limit that will maximize the amount of events that fit in each chunk.
+	// After creating a chunk it will determine if it should scale up and down based on the chunk size vs the limit.
+	// If the chunk didn't reach the limit perhaps future events could have been added.
+	softLimit                  int64
+	softLimitScaleUpExponent   float64
+	softLimitScaleDownExponent float64
+
+	bytesWritten int
+	buf          *bytes.Buffer
+	w            *gzip.Writer
+	metrics      metrics.Metrics
 }

 func newChunkEncoder(limit int64) *chunkEncoder {
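
The struct comment above describes scaling the soft limit up and down; the scale-up rule itself appears in the reset() hunk below. A minimal standalone sketch of that multiplier math, assuming softLimitBaseFactor = 2 and softLimitExponentScaleFactor = 1 (illustrative values; the real constants are defined in encoder.go):

package main

import (
	"fmt"
	"math"
)

func main() {
	// Hypothetical starting soft limit of 32 KiB.
	softLimit, exponent := int64(32768), float64(0)
	for i := 0; i < 5; i++ {
		// Same shape as reset(): the multiplier itself grows each round.
		mul := int64(math.Pow(2, exponent+1))
		softLimit *= mul
		exponent++
		fmt.Println(softLimit)
	}
	// Prints: 65536, 262144, 2097152, 33554432, 1073741824
}

Because the multiplier doubles on every scale-up, the soft limit grows on the order of 2^(k(k+1)/2) after k scale-ups; under these assumed constants a 32 KiB starting value passes math.MaxInt64 after roughly ten scale-ups, which is the overflow discussed in the review thread below.
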
@@ -141,18 +145,30 @@ func (enc *chunkEncoder) reset() ([][]byte, error) {
 	// decisions in the last chunk.
 	// 3) Equilibrium: If the chunk size is between 90% and 100% of the user-configured limit, maintain soft limit value.

-	if enc.buf.Len() < int(float64(enc.limit)*encHardLimitThreshold) {
+	if enc.bytesWritten < int(float64(enc.limit)*encHardLimitThreshold) {
 		if enc.metrics != nil {
 			enc.metrics.Counter(encSoftLimitScaleUpCounterName).Incr()
 		}

 		mul := int64(math.Pow(float64(softLimitBaseFactor), float64(enc.softLimitScaleUpExponent+1)))
+		// this can cause enc.softLimit to overflow into a negative value

Contributor:

What are the circumstances for a scenario where we reach an overflow? Since the thing we're exponentially increasing is upload bytes, for us to overflow, wouldn't the previous successful reset have needed a soft limit that was already terabytes in size?

This is intuition talking rather than actual calculus, so I may be way off in my estimates. It's very likely I'm missing something here, since you've encountered this in your work and had to fix it.

Contributor (Author):

As we discussed, I updated the PR to enforce a maximum configurable limit of 4294967296 instead, removing the need to check whether the soft limit will ever overflow.

 		enc.softLimit *= mul
 		enc.softLimitScaleUpExponent += softLimitExponentScaleFactor
+
+		// In Go an overflow wraps around using modulo arithmetic, so it could be negative.
+		// enc.limit*2 is the ceiling for the soft limit, unless that also overflows then it will be (math.MaxInt64 - 1).
+		if enc.softLimit < 0 || enc.softLimit > enc.limit*2 {
+			limit := enc.limit * 2
+			if limit < 0 {
+				limit = math.MaxInt64 - 1
+			}
+			enc.softLimit = limit

Contributor:

As always when it comes to math, I'm a bit confused 😅. Why are we setting the soft limit to 2x the configured limit (or even higher) here? Won't that cause us to write past the configured limit in WriteBytes()? There is probably some detail I'm missing.

Contributor (Author):

Deleted the math, it won't hurt us anymore 😜

+			enc.softLimitScaleUpExponent = 0
+		}
 		return enc.update(), nil
 	}

-	if int(enc.limit) > enc.buf.Len() && enc.buf.Len() >= int(float64(enc.limit)*encHardLimitThreshold) {
+	if int(enc.limit) > enc.bytesWritten && enc.bytesWritten >= int(float64(enc.limit)*encHardLimitThreshold) {
 		if enc.metrics != nil {
 			enc.metrics.Counter(encSoftLimitStableCounterName).Incr()
 		}
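
The overflow guard added above relies on Go's wraparound semantics: Go does not trap on signed integer overflow, the value simply wraps (two's complement). A minimal sketch, not part of the PR, of what "overflow wraps around using modulo arithmetic" means for an int64 soft limit:

package main

import (
	"fmt"
	"math"
)

func main() {
	softLimit := int64(math.MaxInt64/2 + 1) // 2^62
	softLimit *= 2                          // 2^63 doesn't fit: wraps to math.MinInt64
	fmt.Println(softLimit)                  // -9223372036854775808
	fmt.Println(softLimit < 0)              // true, which is why reset() checks softLimit < 0
}
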
v1/plugins/logs/encoder_test.go (50 changes: 45 additions & 5 deletions)
@@ -5,6 +5,7 @@
 package logs

 import (
+	"math"
 	"strconv"
 	"testing"
 	"time"
@@ -84,8 +85,9 @@ func TestChunkEncoderSizeLimit(t *testing.T) {
 }

 func TestChunkEncoderAdaptive(t *testing.T) {
-
-	enc := newChunkEncoder(1000).WithMetrics(metrics.New())
+	// limit is set to 1050, so that 90% is 945 which is larger than the event size of 936
+	// this will trigger the adaptive changing of the soft limit
+	enc := newChunkEncoder(1050).WithMetrics(metrics.New())
 	var result interface{} = false
 	var expInput interface{} = map[string]interface{}{"method": "GET"}
 	ts, err := time.Parse(time.RFC3339Nano, "2018-01-01T12:00:00.123456Z")
@@ -149,9 +151,9 @@ func TestChunkEncoderAdaptive(t *testing.T) {
 	actualScaleDownEvents := enc.metrics.Counter(encSoftLimitScaleDownCounterName).Value().(uint64)
 	actualEquiEvents := enc.metrics.Counter(encSoftLimitStableCounterName).Value().(uint64)

-	expectedScaleUpEvents := uint64(8)
-	expectedScaleDownEvents := uint64(3)
-	expectedEquiEvents := uint64(0)
+	expectedScaleUpEvents := uint64(25)
+	expectedScaleDownEvents := uint64(25)
+	expectedEquiEvents := uint64(75)

 	if actualScaleUpEvents != expectedScaleUpEvents {
 		t.Fatalf("Expected scale up events %v but got %v", expectedScaleUpEvents, actualScaleUpEvents)
@@ -179,3 +181,41 @@ func decodeChunks(t *testing.T, bs [][]byte) int {
 	}
 	return numEvents
 }
+
+func TestReset(t *testing.T) {
+	tests := []struct {
+		name              string
+		limit             int64
+		expectedSoftLimit int64
+	}{
+		{
+			name:              "limit 100",
+			limit:             100,
+			expectedSoftLimit: 200,
+		},
+		{
+			name:              "limit max int64 - 1",
+			limit:             math.MaxInt64 - 1,
+			expectedSoftLimit: math.MaxInt64 - 1,
+		},
+	}
+
+	for _, tc := range tests {
+		t.Run(tc.name, func(t *testing.T) {
+			enc := newChunkEncoder(tc.limit)
+
+			for range 100 {
+				_, err := enc.reset()
+				if err != nil {
+					t.Fatal(err)
+				}
+
+				if enc.softLimit != tc.expectedSoftLimit {
+					t.Fatalf("expected softLimit %d, got %d", tc.expectedSoftLimit, enc.softLimit)
+				}
+			}
+		})
+	}
+}
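
TestReset pins down the capping rule from the encoder diff: the soft limit may scale past the configured limit but is clamped to 2*limit, and to math.MaxInt64 - 1 when even 2*limit overflows. Extracted into a hypothetical standalone helper for illustration (capSoftLimit is not a real function in the codebase):

package main

import (
	"fmt"
	"math"
)

// capSoftLimit mirrors the guard in reset(): clamp when the multiplication
// wrapped around, or when the soft limit outgrew twice the configured limit.
func capSoftLimit(softLimit, limit int64) int64 {
	if softLimit < 0 || softLimit > limit*2 {
		ceiling := limit * 2
		if ceiling < 0 { // limit*2 itself wrapped around
			ceiling = math.MaxInt64 - 1
		}
		return ceiling
	}
	return softLimit
}

func main() {
	fmt.Println(capSoftLimit(400, 100))                       // 200
	fmt.Println(capSoftLimit(math.MinInt64, math.MaxInt64-1)) // 9223372036854775806
}

With limit = 100 every reset settles on 200; with limit = math.MaxInt64 - 1 the doubled ceiling wraps negative, so the clamp lands on math.MaxInt64 - 1, matching the two test cases.
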
v1/plugins/logs/plugin_test.go (36 changes: 22 additions & 14 deletions)
@@ -408,7 +408,7 @@ func TestPluginStartSameInput(t *testing.T) {
 	fixture := newTestFixture(t)
 	defer fixture.server.stop()

-	fixture.server.ch = make(chan []EventV1, 3)
+	fixture.server.ch = make(chan []EventV1, 4)
 	var result interface{} = false

 	ts, err := time.Parse(time.RFC3339Nano, "2018-01-01T12:00:00.123456Z")
@@ -441,12 +441,15 @@ func TestPluginStartSameInput(t *testing.T) {
 	chunk1 := <-fixture.server.ch
 	chunk2 := <-fixture.server.ch
 	chunk3 := <-fixture.server.ch
+	chunk4 := <-fixture.server.ch
 	expLen1 := 122
-	expLen2 := 242
-	expLen3 := 36

Contributor:

For this test to remain equivalent, maybe we should raise the number of events fired, or tweak the upload limit, so that we keep producing multiple chunks here?

+	expLen2 := 121
+	expLen3 := 121
+	expLen4 := 36

-	if len(chunk1) != expLen1 || len(chunk2) != expLen2 || len(chunk3) != expLen3 {
-		t.Fatalf("Expected chunk lens %v, %v, and %v but got: %v, %v, and %v", expLen1, expLen2, expLen3, len(chunk1), len(chunk2), len(chunk3))
+	if len(chunk1) != expLen1 || len(chunk2) != expLen2 || len(chunk3) != expLen3 || len(chunk4) != expLen4 {
+		t.Fatalf("Expected chunk lens %v, %v, %v and %v but got: %v, %v, %v and %v",
+			expLen1, expLen2, expLen3, expLen4, len(chunk1), len(chunk2), len(chunk3), len(chunk4))
 	}

 	var expInput interface{} = map[string]interface{}{"method": "GET"}
@@ -472,8 +475,8 @@ func TestPluginStartSameInput(t *testing.T) {
 		Metrics: msAsFloat64,
 	}

-	if !reflect.DeepEqual(chunk3[expLen3-1], exp) {
-		t.Fatalf("Expected %+v but got %+v", exp, chunk3[expLen3-1])
+	if !reflect.DeepEqual(chunk4[expLen4-1], exp) {
+		t.Fatalf("Expected %+v but got %+v", exp, chunk4[expLen4-1])
 	}

 	if fixture.plugin.status.Code != "" {
@@ -489,7 +492,7 @@ func TestPluginStartChangingInputValues(t *testing.T) {
 	fixture := newTestFixture(t)
 	defer fixture.server.stop()

-	fixture.server.ch = make(chan []EventV1, 3)
+	fixture.server.ch = make(chan []EventV1, 4)
 	var result interface{} = false

 	ts, err := time.Parse(time.RFC3339Nano, "2018-01-01T12:00:00.123456Z")
@@ -521,12 +524,15 @@ func TestPluginStartChangingInputValues(t *testing.T) {
 	chunk1 := <-fixture.server.ch
 	chunk2 := <-fixture.server.ch
 	chunk3 := <-fixture.server.ch
+	chunk4 := <-fixture.server.ch
 	expLen1 := 124
-	expLen2 := 247
-	expLen3 := 29
+	expLen2 := 123
+	expLen3 := 123
+	expLen4 := 30

-	if len(chunk1) != expLen1 || len(chunk2) != expLen2 || len((chunk3)) != expLen3 {
-		t.Fatalf("Expected chunk lens %v, %v and %v but got: %v, %v and %v", expLen1, expLen2, expLen3, len(chunk1), len(chunk2), len(chunk3))
+	if len(chunk1) != expLen1 || len(chunk2) != expLen2 || len(chunk3) != expLen3 || len(chunk4) != expLen4 {
+		t.Fatalf("Expected chunk lens %v, %v, %v and %v but got: %v, %v, %v and %v",
+			expLen1, expLen2, expLen3, expLen4, len(chunk1), len(chunk2), len(chunk3), len(chunk4))
 	}

 	exp := EventV1{
@@ -544,8 +550,8 @@ func TestPluginStartChangingInputValues(t *testing.T) {
 		Timestamp: ts,
 	}

-	if !reflect.DeepEqual(chunk3[expLen3-1], exp) {
-		t.Fatalf("Expected %+v but got %+v", exp, chunk3[expLen3-1])
+	if !reflect.DeepEqual(chunk4[expLen4-1], exp) {
+		t.Fatalf("Expected %+v but got %+v", exp, chunk4[expLen4-1])
 	}
 }

@@ -3564,6 +3570,8 @@ type testServer struct {
 }

 func (t *testServer) handle(w http.ResponseWriter, r *http.Request) {
+	t.t.Helper()
+
 	gr, err := gzip.NewReader(r.Body)
 	if err != nil {
 		t.t.Fatal(err)
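
The chunk counts in these tests shift because the diff above switches the encoder's accounting in reset() from enc.buf.Len() to enc.bytesWritten, per the PR title basing decisions on compressed event size. Raw and gzip-compressed sizes diverge sharply for repetitive decision-log events, so the point at which a chunk hits the limit moves. A rough standalone illustration of that gap (illustrative only, not code from this PR):

package main

import (
	"bytes"
	"compress/gzip"
	"fmt"
)

func main() {
	var buf bytes.Buffer
	w := gzip.NewWriter(&buf)

	// 100 identical toy "events": highly compressible input.
	raw := bytes.Repeat([]byte(`{"method":"GET"}`), 100)
	if _, err := w.Write(raw); err != nil {
		panic(err)
	}
	if err := w.Close(); err != nil {
		panic(err)
	}

	fmt.Println(len(raw))  // 1600 bytes uncompressed
	fmt.Println(buf.Len()) // a few dozen bytes compressed
}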