Skip to content

Commit 7136e99

Browse files
authored
credentials/alts: Pool write buffers (#8919)
Fixes: #8906 This change removes the fixed-size read buffer used by each ALTS connection. A new, internal "dirty" buffer pool is introduced to allow fetching buffers without the overhead of clearing them first. This PR also addresses a few comments from #8910 that were not pushed before that PR was merged. ## Results A new micro-benchmark was added to measure memory usage by a `conn`, demonstrating a ~40% reduction in memory usage. Existing performance benchmark shows no regressions. ``` goos: linux goarch: amd64 pkg: google.golang.org/grpc/credentials/alts/internal/conn cpu: Intel(R) Xeon(R) CPU @ 2.60GHz │ old.txt │ new.txt │ │ sec/op │ sec/op vs base │ LargeMessage-48 80.81m ± ∞ ¹ 79.96m ± ∞ ¹ ~ (p=0.548 n=5) MemoryUsage-48 25.45µ ± ∞ ¹ 14.29µ ± ∞ ¹ -43.85% (p=0.008 n=5) geomean 1.434m 1.069m -25.46% ¹ need >= 6 samples for confidence interval at level 0.95 │ old.txt │ new.txt │ │ B/op │ B/op vs base │ LargeMessage-48 4.582Mi ± ∞ ¹ 4.578Mi ± ∞ ¹ -0.08% (p=0.008 n=5) MemoryUsage-48 147.16Ki ± ∞ ¹ 83.33Ki ± ∞ ¹ -43.38% (p=0.008 n=5) geomean 830.9Ki 625.0Ki -24.78% ¹ need >= 6 samples for confidence interval at level 0.95 │ old.txt │ new.txt │ │ allocs/op │ allocs/op vs base │ LargeMessage-48 2.000 ± ∞ ¹ 2.000 ± ∞ ¹ ~ (p=1.000 n=5) ² MemoryUsage-48 20.00 ± ∞ ¹ 18.00 ± ∞ ¹ -10.00% (p=0.008 n=5) geomean 6.325 6.000 -5.13% ¹ need >= 6 samples for confidence interval at level 0.95 ² all samples are equal ``` RELEASE NOTES: * credentials/alts: Pool write buffers to reduce memory usage
1 parent 46a31de commit 7136e99

5 files changed

Lines changed: 200 additions & 31 deletions

File tree

credentials/alts/internal/conn/record.go

Lines changed: 26 additions & 14 deletions
Original file line numberDiff line numberDiff line change
@@ -27,6 +27,7 @@ import (
2727
"net"
2828

2929
core "google.golang.org/grpc/credentials/alts/internal"
30+
"google.golang.org/grpc/internal/mem"
3031
)
3132

3233
// ALTSRecordCrypto is the interface for gRPC ALTS record protocol.
@@ -62,8 +63,6 @@ const (
6263
altsRecordDefaultLength = 4 * 1024 // 4KiB
6364
// Message type value included in ALTS record framing.
6465
altsRecordMsgType = uint32(0x06)
65-
// The initial write buffer size.
66-
altsWriteBufferInitialSize = 32 * 1024 // 32KiB
6766
// The maximum write buffer size. This *must* be multiple of
6867
// altsRecordDefaultLength.
6968
altsWriteBufferMaxSize = 512 * 1024 // 512KiB
@@ -74,9 +73,26 @@ const (
7473
)
7574

7675
var (
77-
protocols = make(map[string]ALTSRecordFunc)
76+
protocols = make(map[string]ALTSRecordFunc)
77+
writeBufPool *mem.BinaryTieredBufferPool
7878
)
7979

80+
func init() {
81+
pool, err := mem.NewDirtyBinaryTieredBufferPool(
82+
8,
83+
12, // 4KB, typical OS page size
84+
14, // 16KB (max HTTP/2 frame size used by gRPC)
85+
15, // 32KB (default buffer size for gRPC)
86+
16, // 64KB
87+
17, // 128KB
88+
19, // 512KB, max write buffer size
89+
)
90+
if err != nil {
91+
panic(fmt.Sprintf("Failed to create write buffer pool: %v", err))
92+
}
93+
writeBufPool = pool
94+
}
95+
8096
// RegisterProtocol registers an ALTS record encryption protocol.
8197
func RegisterProtocol(protocol string, f ALTSRecordFunc) error {
8298
if _, ok := protocols[protocol]; ok {
@@ -97,9 +113,6 @@ type conn struct {
97113
// protected holds data read from the network but has not yet been
98114
// decrypted. This data might not compose a complete frame.
99115
protected []byte
100-
// writeBuf is a buffer used to contain encrypted frames before being
101-
// written to the network.
102-
writeBuf []byte
103116
// nextFrame stores the next frame (in protected buffer) info.
104117
nextFrame []byte
105118
// overhead is the calculated overhead of each frame.
@@ -132,7 +145,6 @@ func NewConn(c net.Conn, side core.Side, recordProtocol string, key []byte, prot
132145
crypto: crypto,
133146
payloadLengthLimit: payloadLengthLimit,
134147
protected: protectedBuf,
135-
writeBuf: make([]byte, altsWriteBufferInitialSize),
136148
nextFrame: protectedBuf,
137149
overhead: overhead,
138150
}
@@ -233,16 +245,16 @@ func (p *conn) Write(b []byte) (n int, err error) {
233245
// Calculate the output buffer size with framing and encryption overhead.
234246
numOfFrames := int(math.Ceil(float64(len(b)) / float64(p.payloadLengthLimit)))
235247
size := len(b) + numOfFrames*p.overhead
236-
// If writeBuf is too small, increase its size up to the maximum size.
237248
partialBSize := len(b)
238249
if size > altsWriteBufferMaxSize {
239250
size = altsWriteBufferMaxSize
240251
const numOfFramesInMaxWriteBuf = altsWriteBufferMaxSize / altsRecordDefaultLength
241252
partialBSize = numOfFramesInMaxWriteBuf * p.payloadLengthLimit
242253
}
243-
if len(p.writeBuf) < size {
244-
p.writeBuf = make([]byte, size)
245-
}
254+
// Get a writeBuf of the required length.
255+
bufHandle := writeBufPool.Get(size)
256+
defer writeBufPool.Put(bufHandle)
257+
writeBuf := *bufHandle
246258

247259
for partialBStart := 0; partialBStart < len(b); partialBStart += partialBSize {
248260
partialBEnd := partialBStart + partialBSize
@@ -263,7 +275,7 @@ func (p *conn) Write(b []byte) (n int, err error) {
263275
// if any.
264276

265277
// 1. Fill in type field.
266-
msg := p.writeBuf[writeBufIndex+MsgLenFieldSize:]
278+
msg := writeBuf[writeBufIndex+MsgLenFieldSize:]
267279
binary.LittleEndian.PutUint32(msg, altsRecordMsgType)
268280

269281
// 2. Encrypt the payload and create a tag if any.
@@ -273,12 +285,12 @@ func (p *conn) Write(b []byte) (n int, err error) {
273285
}
274286

275287
// 3. Fill in the size field.
276-
binary.LittleEndian.PutUint32(p.writeBuf[writeBufIndex:], uint32(len(msg)))
288+
binary.LittleEndian.PutUint32(writeBuf[writeBufIndex:], uint32(len(msg)))
277289

278290
// 4. Increase writeBufIndex.
279291
writeBufIndex += len(buf) + p.overhead
280292
}
281-
nn, err := p.Conn.Write(p.writeBuf[:writeBufIndex])
293+
nn, err := p.Conn.Write(writeBuf[:writeBufIndex])
282294
if err != nil {
283295
// We need to calculate the actual data size that was
284296
// written. This means we need to remove header,

credentials/alts/internal/conn/record_test.go

Lines changed: 14 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -369,3 +369,17 @@ func (s) TestProtectedBuffer(t *testing.T) {
369369
testProtectedBuffer(t, rp)
370370
}
371371
}
372+
373+
// BenchmarkMemoryUsage measures the allocations per ALTS connection.
374+
// Run this with: go test -bench=BenchmarkMemoryUsage -benchmem
375+
func BenchmarkMemoryUsage(b *testing.B) {
376+
b.ReportAllocs()
377+
378+
for i := 0; i < b.N; i++ {
379+
c, _ := newConnPair(rekeyRecordProtocol, nil, nil)
380+
381+
if _, err := c.Write([]byte("d")); err != nil {
382+
b.Fatalf("Write failed: %v", err)
383+
}
384+
}
385+
}
Lines changed: 36 additions & 11 deletions
Original file line numberDiff line numberDiff line change
@@ -16,7 +16,8 @@
1616
*
1717
*/
1818

19-
// Package mem provides a tiered buffer pool implementation for efficient memory management.
19+
// Package mem provides utilities that facilitate memory reuse in byte slices
20+
// that are used as buffers.
2021
package mem
2122

2223
import (
@@ -46,7 +47,8 @@ type bufferPool interface {
4647
Put(*[]byte)
4748
}
4849

49-
// BinaryTieredBufferPool is a buffer pool that uses multiple sub-pools with power-of-two sizes.
50+
// BinaryTieredBufferPool is a buffer pool that uses multiple sub-pools with
51+
// power-of-two sizes.
5052
type BinaryTieredBufferPool struct {
5153
// exponentToNextLargestPoolMap maps a power-of-two exponent (e.g., 12 for
5254
// 4KB) to the index of the next largest sizedBufferPool. This is used by
@@ -69,12 +71,27 @@ type BinaryTieredBufferPool struct {
6971
// of 2), not the raw byte sizes. For example, to create a pool of 16KB buffers
7072
// (2^14 bytes), pass 14 as the argument.
7173
func NewBinaryTieredBufferPool(powerOfTwoExponents ...uint8) (*BinaryTieredBufferPool, error) {
74+
return newBinaryTiered(func(size int) bufferPool {
75+
return newSizedBufferPool(size, true)
76+
}, &simpleBufferPool{shouldZero: true}, powerOfTwoExponents...)
77+
}
78+
79+
// NewDirtyBinaryTieredBufferPool returns a BufferPool backed by multiple
80+
// sub-pools. It is similar to NewBinaryTieredBufferPool but it does not
81+
// initialize the buffers before returning them.
82+
func NewDirtyBinaryTieredBufferPool(powerOfTwoExponents ...uint8) (*BinaryTieredBufferPool, error) {
83+
return newBinaryTiered(func(size int) bufferPool {
84+
return newSizedBufferPool(size, false)
85+
}, &simpleBufferPool{shouldZero: false}, powerOfTwoExponents...)
86+
}
87+
88+
func newBinaryTiered(sizedPoolFactory func(int) bufferPool, fallbackPool bufferPool, powerOfTwoExponents ...uint8) (*BinaryTieredBufferPool, error) {
7289
slices.Sort(powerOfTwoExponents)
7390
powerOfTwoExponents = slices.Compact(powerOfTwoExponents)
7491

7592
// Determine the maximum exponent we need to support. This depends on the
7693
// word size (32-bit vs 64-bit).
77-
maxExponent := uintSize - 1
94+
maxExponent := uintSize - 2
7895
indexOfNextLargestBit := slices.Repeat([]int{-1}, maxExponent+1)
7996
indexOfPreviousLargestBit := slices.Repeat([]int{-1}, maxExponent+1)
8097

@@ -88,7 +105,7 @@ func NewBinaryTieredBufferPool(powerOfTwoExponents ...uint8) (*BinaryTieredBuffe
88105
return nil, fmt.Errorf("mem: allocating slice of size 2^%d is not possible", exp)
89106
}
90107
tierSize := 1 << exp
91-
pools = append(pools, newSizedBufferPool(tierSize))
108+
pools = append(pools, sizedPoolFactory(tierSize))
92109
maxTier = max(maxTier, tierSize)
93110

94111
// Map the exact power of 2 to this pool index.
@@ -117,7 +134,7 @@ func NewBinaryTieredBufferPool(powerOfTwoExponents ...uint8) (*BinaryTieredBuffe
117134
exponentToPreviousLargestPoolMap: indexOfPreviousLargestBit,
118135
sizedPools: pools,
119136
maxPoolCap: maxTier,
120-
fallbackPool: &simpleBufferPool{},
137+
fallbackPool: fallbackPool,
121138
}, nil
122139
}
123140

@@ -203,6 +220,7 @@ func (NopBufferPool) Put(*[]byte) {
203220
type sizedBufferPool struct {
204221
pool sync.Pool
205222
defaultSize int
223+
shouldZero bool
206224
}
207225

208226
func (p *sizedBufferPool) Get(size int) *[]byte {
@@ -212,7 +230,9 @@ func (p *sizedBufferPool) Get(size int) *[]byte {
212230
return &buf
213231
}
214232
b := *buf
215-
clear(b[:cap(b)])
233+
if p.shouldZero {
234+
clear(b[:cap(b)])
235+
}
216236
*buf = b[:size]
217237
return buf
218238
}
@@ -227,9 +247,10 @@ func (p *sizedBufferPool) Put(buf *[]byte) {
227247
p.pool.Put(buf)
228248
}
229249

230-
func newSizedBufferPool(size int) *sizedBufferPool {
250+
func newSizedBufferPool(size int, zero bool) *sizedBufferPool {
231251
return &sizedBufferPool{
232252
defaultSize: size,
253+
shouldZero: zero,
233254
}
234255
}
235256

@@ -246,10 +267,11 @@ func NewTieredBufferPool(poolSizes ...int) *TieredBufferPool {
246267
sort.Ints(poolSizes)
247268
pools := make([]*sizedBufferPool, len(poolSizes))
248269
for i, s := range poolSizes {
249-
pools[i] = newSizedBufferPool(s)
270+
pools[i] = newSizedBufferPool(s, true)
250271
}
251272
return &TieredBufferPool{
252-
sizedPools: pools,
273+
sizedPools: pools,
274+
fallbackPool: simpleBufferPool{shouldZero: true},
253275
}
254276
}
255277

@@ -280,13 +302,16 @@ func (p *TieredBufferPool) getPool(size int) bufferPool {
280302
// acquire a buffer from the pool but if that buffer is too small, it returns it
281303
// to the pool and creates a new one.
282304
type simpleBufferPool struct {
283-
pool sync.Pool
305+
pool sync.Pool
306+
shouldZero bool
284307
}
285308

286309
func (p *simpleBufferPool) Get(size int) *[]byte {
287310
bs, ok := p.pool.Get().(*[]byte)
288311
if ok && cap(*bs) >= size {
289-
clear((*bs)[:cap(*bs)])
312+
if p.shouldZero {
313+
clear((*bs)[:cap(*bs)])
314+
}
290315
*bs = (*bs)[:size]
291316
return bs
292317
}
Lines changed: 118 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,118 @@
1+
/*
2+
*
3+
* Copyright 2026 gRPC authors.
4+
*
5+
* Licensed under the Apache License, Version 2.0 (the "License");
6+
* you may not use this file except in compliance with the License.
7+
* You may obtain a copy of the License at
8+
*
9+
* http://www.apache.org/licenses/LICENSE-2.0
10+
*
11+
* Unless required by applicable law or agreed to in writing, software
12+
* distributed under the License is distributed on an "AS IS" BASIS,
13+
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14+
* See the License for the specific language governing permissions and
15+
* limitations under the License.
16+
*
17+
*/
18+
19+
package mem_test
20+
21+
import (
22+
"testing"
23+
"unsafe"
24+
25+
"google.golang.org/grpc/internal/grpctest"
26+
"google.golang.org/grpc/internal/mem"
27+
)
28+
29+
type s struct {
30+
grpctest.Tester
31+
}
32+
33+
func Test(t *testing.T) {
34+
grpctest.RunSubTests(t, s{})
35+
}
36+
37+
func (s) TestBufferPool_Clears(t *testing.T) {
38+
poolConfigs := []struct {
39+
name string
40+
factory func() (*mem.BinaryTieredBufferPool, error)
41+
wantCleared bool
42+
bufferSize int
43+
}{
44+
{
45+
name: "regular_sized",
46+
factory: func() (*mem.BinaryTieredBufferPool, error) {
47+
return mem.NewBinaryTieredBufferPool(3) // 8 bytes
48+
},
49+
bufferSize: 8,
50+
wantCleared: true,
51+
},
52+
{
53+
name: "regular_fallback",
54+
factory: func() (*mem.BinaryTieredBufferPool, error) {
55+
return mem.NewBinaryTieredBufferPool(3)
56+
},
57+
bufferSize: 10,
58+
wantCleared: true,
59+
},
60+
{
61+
name: "dirty_sized",
62+
factory: func() (*mem.BinaryTieredBufferPool, error) {
63+
return mem.NewDirtyBinaryTieredBufferPool(3)
64+
},
65+
bufferSize: 8,
66+
wantCleared: false,
67+
},
68+
{
69+
name: "dirty_fallback",
70+
factory: func() (*mem.BinaryTieredBufferPool, error) {
71+
return mem.NewDirtyBinaryTieredBufferPool(3)
72+
},
73+
bufferSize: 10,
74+
wantCleared: false,
75+
},
76+
}
77+
78+
for _, tc := range poolConfigs {
79+
t.Run(tc.name, func(t *testing.T) {
80+
pool, err := tc.factory()
81+
if err != nil {
82+
t.Fatalf("Failed to create pool: %v", err)
83+
}
84+
85+
for {
86+
buf1 := pool.Get(tc.bufferSize)
87+
// Mark the buffer with data.
88+
for i := range *buf1 {
89+
(*buf1)[i] = 0xAA
90+
}
91+
pool.Put(buf1)
92+
93+
buf2 := pool.Get(tc.bufferSize)
94+
// Check if we got the same underlying array.
95+
if unsafe.SliceData(*buf1) != unsafe.SliceData(*buf2) {
96+
pool.Put(buf2)
97+
continue
98+
}
99+
100+
// We have a reused buffer. Check if it's cleared.
101+
gotCleared := true
102+
for _, b := range *buf2 {
103+
if b != 0 {
104+
gotCleared = false
105+
break
106+
}
107+
}
108+
109+
if tc.wantCleared != gotCleared {
110+
t.Fatalf("buffer cleared state mismatch: want %t, got %v", tc.wantCleared, gotCleared)
111+
}
112+
113+
pool.Put(buf2)
114+
break
115+
}
116+
})
117+
}
118+
}

0 commit comments

Comments
 (0)