package protocol

import (
	"bytes"
	"compress/gzip"
	"context"
	"encoding/binary"
	"fmt"
	"hash/crc32"
	"strings"

	"github.com/seaweedfs/seaweedfs/weed/glog"
	"github.com/seaweedfs/seaweedfs/weed/mq/kafka/compression"
	"github.com/seaweedfs/seaweedfs/weed/mq/kafka/integration"
)

// MultiBatchFetcher handles fetching multiple record batches with size limits
type MultiBatchFetcher struct {
	handler *Handler
}

// NewMultiBatchFetcher creates a new multi-batch fetcher
func NewMultiBatchFetcher(handler *Handler) *MultiBatchFetcher {
	return &MultiBatchFetcher{handler: handler}
}

// FetchResult represents the result of a multi-batch fetch operation
type FetchResult struct {
	RecordBatches []byte // Concatenated record batches
	NextOffset    int64  // Next offset to fetch from
	TotalSize     int32  // Total size of all batches
	BatchCount    int    // Number of batches included
}

// FetchMultipleBatches fetches multiple record batches up to the maxBytes limit.
// ctx controls the fetch timeout (should match the Kafka fetch request's MaxWaitTime).
func (f *MultiBatchFetcher) FetchMultipleBatches(ctx context.Context, topicName string, partitionID int32, startOffset, highWaterMark int64, maxBytes int32) (*FetchResult, error) {
	if startOffset >= highWaterMark {
		return &FetchResult{
			RecordBatches: []byte{},
			NextOffset:    startOffset,
			TotalSize:     0,
			BatchCount:    0,
		}, nil
	}

	// Minimum size for basic response headers and one empty batch
	minResponseSize := int32(200)
	if maxBytes < minResponseSize {
		maxBytes = minResponseSize
	}

	var combinedBatches []byte
	currentOffset := startOffset
	totalSize := int32(0)
	batchCount := 0

	// Estimate records per batch from the available maxBytes, assuming an
	// average message size plus batch overhead. The client asked for up to
	// maxBytes, so use most of it: start with larger batches to maximize
	// throughput.
	estimatedMsgSize := int32(1024)                        // Typical message size with overhead
	recordsPerBatch := (maxBytes - 200) / estimatedMsgSize // Use available space efficiently
	if recordsPerBatch < 100 {
		recordsPerBatch = 100 // Minimum 100 records per batch
	}
	if recordsPerBatch > 10000 {
		recordsPerBatch = 10000 // Cap at 10k records per batch to avoid huge memory allocations
	}
	maxBatchesPerFetch := int((maxBytes - 200) / (estimatedMsgSize * 10)) // Reasonable limit
	if maxBatchesPerFetch < 5 {
		maxBatchesPerFetch = 5 // At least 5 batches
	}
	if maxBatchesPerFetch > 100 {
		maxBatchesPerFetch = 100 // At most 100 batches
	}

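	// Worked example (illustrative): with maxBytes = 1 MiB,
	// recordsPerBatch = (1048576-200)/1024 = 1023 and
	// maxBatchesPerFetch = (1048576-200)/10240 = 102, clamped to 100.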
	for batchCount < maxBatchesPerFetch && currentOffset < highWaterMark {

		// Calculate remaining space
		remainingBytes := maxBytes - totalSize
		if remainingBytes < 100 { // Need at least 100 bytes for a minimal batch
			break
		}

		// Adapt records per batch to the remaining space: with less space
		// left, fetch fewer records to avoid overshooting maxBytes
		currentBatchSize := recordsPerBatch
		if remainingBytes < recordsPerBatch*estimatedMsgSize {
			currentBatchSize = remainingBytes / estimatedMsgSize
			if currentBatchSize < 1 {
				currentBatchSize = 1
			}
		}

		// Calculate how many records to fetch for this batch
		recordsAvailable := highWaterMark - currentOffset
		if recordsAvailable <= 0 {
			break
		}

		recordsToFetch := currentBatchSize
		if int64(recordsToFetch) > recordsAvailable {
			recordsToFetch = int32(recordsAvailable)
		}

		// Check if the handler is nil
		if f.handler == nil {
			break
		}
		if f.handler.seaweedMQHandler == nil {
			break
		}

		// Fetch records for this batch, passing ctx to respect the Kafka
		// fetch request's MaxWaitTime
		smqRecords, err := f.handler.seaweedMQHandler.GetStoredRecords(ctx, topicName, partitionID, currentOffset, int(recordsToFetch))
		if err != nil || len(smqRecords) == 0 {
			break
		}

		// Construct the record batch; the actual size is checked after
		// construction
		batch := f.constructSingleRecordBatch(topicName, currentOffset, smqRecords)
		batchSize := int32(len(batch))

		// Double-check the actual size doesn't exceed maxBytes
		if totalSize+batchSize > maxBytes && batchCount > 0 {
			break
		}

		// Add this batch to the combined result
		combinedBatches = append(combinedBatches, batch...)
		totalSize += batchSize
		currentOffset += int64(len(smqRecords))
		batchCount++

		// A short batch means we have likely reached the end of the
		// available data
		if len(smqRecords) < int(recordsPerBatch) {
			break
		}
	}

	result := &FetchResult{
		RecordBatches: combinedBatches,
		NextOffset:    currentOffset,
		TotalSize:     totalSize,
		BatchCount:    batchCount,
	}

	return result, nil
}

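// Illustrative caller sketch for FetchMultipleBatches (hypothetical; names
// like fetchCtx, maxWaitMs, and hwm are assumptions, not part of this file):
//
//	fetchCtx, cancel := context.WithTimeout(ctx, time.Duration(maxWaitMs)*time.Millisecond)
//	defer cancel()
//	fetcher := NewMultiBatchFetcher(handler)
//	res, err := fetcher.FetchMultipleBatches(fetchCtx, topicName, partitionID, fetchOffset, hwm, maxBytes)
//	if err == nil {
//		// res.RecordBatches can be embedded directly in the Fetch response's
//		// records field; res.NextOffset drives the next poll.
//	}
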
// constructSingleRecordBatch creates a single record batch from SMQ records
func (f *MultiBatchFetcher) constructSingleRecordBatch(topicName string, baseOffset int64, smqRecords []integration.SMQRecord) []byte {
	if len(smqRecords) == 0 {
		return f.constructEmptyRecordBatch(baseOffset)
	}

	// Create the record batch using the SMQ records
	batch := make([]byte, 0, 512)

	// Record batch header
	baseOffsetBytes := make([]byte, 8)
	binary.BigEndian.PutUint64(baseOffsetBytes, uint64(baseOffset))
	batch = append(batch, baseOffsetBytes...) // base offset (8 bytes)

	// Batch length (4 bytes) - filled in once the final size is known
	batchLengthPos := len(batch)
	batch = append(batch, 0, 0, 0, 0) // batch length placeholder

	// Partition leader epoch (4 bytes) - use 0 (real Kafka uses 0, not -1)
	batch = append(batch, 0x00, 0x00, 0x00, 0x00)

	// Magic byte (1 byte) - v2 format
	batch = append(batch, 2)

	// CRC placeholder (4 bytes) - calculated later
	crcPos := len(batch)
	batch = append(batch, 0, 0, 0, 0)

	// Attributes (2 bytes) - no compression, CreateTime timestamps, non-transactional
	batch = append(batch, 0, 0)

	// Last offset delta (4 bytes)
	lastOffsetDelta := int32(len(smqRecords) - 1)
	lastOffsetDeltaBytes := make([]byte, 4)
	binary.BigEndian.PutUint32(lastOffsetDeltaBytes, uint32(lastOffsetDelta))
	batch = append(batch, lastOffsetDeltaBytes...)

	// Base timestamp (8 bytes) - convert from nanoseconds to milliseconds for Kafka compatibility
	baseTimestamp := smqRecords[0].GetTimestamp() / 1000000 // Convert nanoseconds to milliseconds
	baseTimestampBytes := make([]byte, 8)
	binary.BigEndian.PutUint64(baseTimestampBytes, uint64(baseTimestamp))
	batch = append(batch, baseTimestampBytes...)

	// Max timestamp (8 bytes) - also converted from nanoseconds to milliseconds
	maxTimestamp := baseTimestamp
	if len(smqRecords) > 1 {
		maxTimestamp = smqRecords[len(smqRecords)-1].GetTimestamp() / 1000000 // Convert nanoseconds to milliseconds
	}
	maxTimestampBytes := make([]byte, 8)
	binary.BigEndian.PutUint64(maxTimestampBytes, uint64(maxTimestamp))
	batch = append(batch, maxTimestampBytes...)

	// Producer ID (8 bytes) - use -1 for no producer ID
	batch = append(batch, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF)

	// Producer epoch (2 bytes) - use -1 for no producer epoch
	batch = append(batch, 0xFF, 0xFF)

	// Base sequence (4 bytes) - use -1 for no base sequence
	batch = append(batch, 0xFF, 0xFF, 0xFF, 0xFF)

	// Record count (4 bytes)
	recordCountBytes := make([]byte, 4)
	binary.BigEndian.PutUint32(recordCountBytes, uint32(len(smqRecords)))
	batch = append(batch, recordCountBytes...)

	// Add individual records from SMQ records
	for i, smqRecord := range smqRecords {
		// Build an individual record
		recordBytes := make([]byte, 0, 128)

		// Record attributes (1 byte)
		recordBytes = append(recordBytes, 0)

		// Timestamp delta (varint) - relative to the base timestamp (both in milliseconds)
		recordTimestampMs := smqRecord.GetTimestamp() / 1000000 // Convert nanoseconds to milliseconds
		timestampDelta := recordTimestampMs - baseTimestamp
		recordBytes = append(recordBytes, encodeVarint(timestampDelta)...)

		// Offset delta (varint)
		offsetDelta := int64(i)
		recordBytes = append(recordBytes, encodeVarint(offsetDelta)...)

		// Key length and key (varint + data) - decode RecordValue to get the original Kafka message
		key := f.handler.decodeRecordValueToKafkaMessage(topicName, smqRecord.GetKey())
		if key == nil {
			recordBytes = append(recordBytes, encodeVarint(-1)...) // null key
		} else {
			recordBytes = append(recordBytes, encodeVarint(int64(len(key)))...)
			recordBytes = append(recordBytes, key...)
		}

		// Value length and value (varint + data) - decode RecordValue to get the original Kafka message
		value := f.handler.decodeRecordValueToKafkaMessage(topicName, smqRecord.GetValue())
		if value == nil {
			recordBytes = append(recordBytes, encodeVarint(-1)...) // null value
		} else {
			recordBytes = append(recordBytes, encodeVarint(int64(len(value)))...)
			recordBytes = append(recordBytes, value...)
		}

		// Headers count (varint) - 0 headers
		recordBytes = append(recordBytes, encodeVarint(0)...)

		// Prepend the record length (varint)
		recordLength := int64(len(recordBytes))
		batch = append(batch, encodeVarint(recordLength)...)
		batch = append(batch, recordBytes...)
	}

	// Fill in the batch length
	batchLength := uint32(len(batch) - batchLengthPos - 4)
	binary.BigEndian.PutUint32(batch[batchLengthPos:batchLengthPos+4], batchLength)

	// Debug: log the reconstructed batch (only at high verbosity)
	if glog.V(4) {
		fmt.Printf("\n━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\n")
		fmt.Printf("📏 RECONSTRUCTED BATCH: topic=%s baseOffset=%d size=%d bytes, recordCount=%d\n",
			topicName, baseOffset, len(batch), len(smqRecords))
	}

	if glog.V(4) && len(batch) >= 61 {
		fmt.Printf("  Header Structure:\n")
		fmt.Printf("    Base Offset (0-7):     %x\n", batch[0:8])
		fmt.Printf("    Batch Length (8-11):   %x\n", batch[8:12])
		fmt.Printf("    Leader Epoch (12-15):  %x\n", batch[12:16])
		fmt.Printf("    Magic (16):            %x\n", batch[16:17])
		fmt.Printf("    CRC (17-20):           %x (WILL BE CALCULATED)\n", batch[17:21])
		fmt.Printf("    Attributes (21-22):    %x\n", batch[21:23])
		fmt.Printf("    Last Offset Delta (23-26): %x\n", batch[23:27])
		fmt.Printf("    Base Timestamp (27-34): %x\n", batch[27:35])
		fmt.Printf("    Max Timestamp (35-42):  %x\n", batch[35:43])
		fmt.Printf("    Producer ID (43-50):    %x\n", batch[43:51])
		fmt.Printf("    Producer Epoch (51-52): %x\n", batch[51:53])
		fmt.Printf("    Base Sequence (53-56):  %x\n", batch[53:57])
		fmt.Printf("    Record Count (57-60):   %x\n", batch[57:61])
		if len(batch) > 61 {
			fmt.Printf("    Records Section (61+):  %x... (%d bytes)\n",
				batch[61:min(81, len(batch))], len(batch)-61)
		}
	}

	// Calculate CRC32 for the batch.
	// Per the Kafka spec, the CRC covers ONLY from the attributes offset (byte 21) onwards;
	// see DefaultRecordBatch.java computeChecksum() - Crc32C.compute(buffer, ATTRIBUTES_OFFSET, ...)
	crcData := batch[crcPos+4:] // Skip the CRC field itself, include the rest
	crc := crc32.Checksum(crcData, crc32.MakeTable(crc32.Castagnoli))

	// CRC debug (only at high verbosity)
	if glog.V(4) {
		batchLengthValue := binary.BigEndian.Uint32(batch[8:12])
		expectedTotalSize := 12 + int(batchLengthValue)
		actualTotalSize := len(batch)

		fmt.Printf("\n  === CRC CALCULATION DEBUG ===\n")
		fmt.Printf("    Batch length field (bytes 8-11): %d\n", batchLengthValue)
		fmt.Printf("    Expected total batch size: %d bytes (12 + %d)\n", expectedTotalSize, batchLengthValue)
		fmt.Printf("    Actual batch size: %d bytes\n", actualTotalSize)
		fmt.Printf("    CRC position: byte %d\n", crcPos)
		fmt.Printf("    CRC data range: bytes %d to %d (%d bytes)\n", crcPos+4, actualTotalSize-1, len(crcData))

		if expectedTotalSize != actualTotalSize {
			fmt.Printf("    SIZE MISMATCH: %d bytes difference!\n", actualTotalSize-expectedTotalSize)
		}

		if crcPos != 17 {
			fmt.Printf("    CRC POSITION WRONG: expected 17, got %d!\n", crcPos)
		}

		fmt.Printf("    CRC data (first 100 bytes of %d):\n", len(crcData))
		dumpSize := 100
		if len(crcData) < dumpSize {
			dumpSize = len(crcData)
		}
		for i := 0; i < dumpSize; i += 20 {
			end := i + 20
			if end > dumpSize {
				end = dumpSize
			}
			fmt.Printf("      [%3d-%3d]: %x\n", i, end-1, crcData[i:end])
		}

		manualCRC := crc32.Checksum(crcData, crc32.MakeTable(crc32.Castagnoli))
		fmt.Printf("    Calculated CRC: 0x%08x\n", crc)
		fmt.Printf("    Manual verify:  0x%08x", manualCRC)
		if crc == manualCRC {
			fmt.Printf(" OK\n")
		} else {
			fmt.Printf(" MISMATCH!\n")
		}

		if actualTotalSize <= 200 {
			fmt.Printf("    Complete batch hex dump (%d bytes):\n", actualTotalSize)
			for i := 0; i < actualTotalSize; i += 16 {
				end := i + 16
				if end > actualTotalSize {
					end = actualTotalSize
				}
				fmt.Printf("      %04d: %x\n", i, batch[i:end])
			}
		}
		fmt.Printf("  === END CRC DEBUG ===\n\n")
	}

	binary.BigEndian.PutUint32(batch[crcPos:crcPos+4], crc)

	if glog.V(4) {
		fmt.Printf("    Final CRC (17-20):     %x (calculated over %d bytes)\n", batch[17:21], len(crcData))

		// VERIFICATION: read back what was just written
		writtenCRC := binary.BigEndian.Uint32(batch[17:21])
		fmt.Printf("    VERIFICATION: CRC we calculated=0x%x, CRC written to batch=0x%x", crc, writtenCRC)
		if crc == writtenCRC {
			fmt.Printf(" OK\n")
		} else {
			fmt.Printf(" MISMATCH!\n")
		}

		// DEBUG: hash the entire batch to check whether reconstructions are identical
		batchHash := crc32.ChecksumIEEE(batch)
		fmt.Printf("    BATCH IDENTITY: hash=0x%08x size=%d topic=%s baseOffset=%d recordCount=%d\n",
			batchHash, len(batch), topicName, baseOffset, len(smqRecords))

		// DEBUG: show the first few record keys/values to verify consistency
		if len(smqRecords) > 0 && strings.Contains(topicName, "loadtest") {
			fmt.Printf("    RECORD SAMPLES:\n")
			for i := 0; i < min(3, len(smqRecords)); i++ {
				keyPreview := smqRecords[i].GetKey()
				if len(keyPreview) > 20 {
					keyPreview = keyPreview[:20]
				}
				valuePreview := smqRecords[i].GetValue()
				if len(valuePreview) > 40 {
					valuePreview = valuePreview[:40]
				}
				fmt.Printf("      [%d] keyLen=%d valueLen=%d keyHex=%x valueHex=%x\n",
					i, len(smqRecords[i].GetKey()), len(smqRecords[i].GetValue()),
					keyPreview, valuePreview)
			}
		}

		fmt.Printf("    Batch for topic=%s baseOffset=%d recordCount=%d\n", topicName, baseOffset, len(smqRecords))
		fmt.Printf("━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━\n\n")
	}

	return batch
}

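// The record fields above rely on encodeVarint, which is defined elsewhere
// in this package. For reference, Kafka records use zigzag-encoded varints; a
// minimal sketch of that encoding, assuming it matches protobuf's sint64
// scheme (illustrative, not this package's implementation):
//
//	func zigzagVarint(v int64) []byte {
//		u := uint64((v << 1) ^ (v >> 63)) // zigzag-map signed to unsigned
//		var out []byte
//		for u >= 0x80 {
//			out = append(out, byte(u)|0x80) // continuation bit set
//			u >>= 7
//		}
//		return append(out, byte(u)) // final byte, continuation bit clear
//	}
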
// constructEmptyRecordBatch creates an empty record batch
func (f *MultiBatchFetcher) constructEmptyRecordBatch(baseOffset int64) []byte {
	// Create a minimal empty record batch
	batch := make([]byte, 0, 61)

	// Base offset (8 bytes)
	baseOffsetBytes := make([]byte, 8)
	binary.BigEndian.PutUint64(baseOffsetBytes, uint64(baseOffset))
	batch = append(batch, baseOffsetBytes...)

	// Batch length (4 bytes) - filled in at the end
	lengthPos := len(batch)
	batch = append(batch, 0, 0, 0, 0)

	// Partition leader epoch (4 bytes) - -1
	batch = append(batch, 0xFF, 0xFF, 0xFF, 0xFF)

	// Magic byte (1 byte) - version 2
	batch = append(batch, 2)

	// CRC32 (4 bytes) - placeholder
	crcPos := len(batch)
	batch = append(batch, 0, 0, 0, 0)

	// Attributes (2 bytes) - no compression, non-transactional
	batch = append(batch, 0, 0)

	// Last offset delta (4 bytes) - -1 for an empty batch
	batch = append(batch, 0xFF, 0xFF, 0xFF, 0xFF)

	// Base timestamp (8 bytes)
	timestamp := uint64(1640995200000) // Fixed timestamp (2022-01-01T00:00:00Z) for empty batches
	timestampBytes := make([]byte, 8)
	binary.BigEndian.PutUint64(timestampBytes, timestamp)
	batch = append(batch, timestampBytes...)

	// Max timestamp (8 bytes) - same as base for an empty batch
	batch = append(batch, timestampBytes...)

	// Producer ID (8 bytes) - -1 for non-transactional
	batch = append(batch, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF)

	// Producer epoch (2 bytes) - -1 for non-transactional
	batch = append(batch, 0xFF, 0xFF)

	// Base sequence (4 bytes) - -1 for non-transactional
	batch = append(batch, 0xFF, 0xFF, 0xFF, 0xFF)

	// Record count (4 bytes) - 0 for an empty batch
	batch = append(batch, 0, 0, 0, 0)

	// Fill in the batch length
	batchLength := len(batch) - 12 // Exclude the base offset and the length field itself
	binary.BigEndian.PutUint32(batch[lengthPos:lengthPos+4], uint32(batchLength))

	// Calculate CRC32 for the batch.
	// Per the Kafka spec, the CRC covers ONLY from the attributes offset (byte 21) onwards;
	// see DefaultRecordBatch.java computeChecksum() - Crc32C.compute(buffer, ATTRIBUTES_OFFSET, ...)
	crcData := batch[crcPos+4:] // Skip the CRC field itself, include the rest
	crc := crc32.Checksum(crcData, crc32.MakeTable(crc32.Castagnoli))
	binary.BigEndian.PutUint32(batch[crcPos:crcPos+4], crc)

	return batch
}

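// For reference, a consumer-side CRC check matching the layout built above
// (illustrative sketch; verifyBatchCRC is a hypothetical helper, and the
// offsets assume the v2 header as constructed in this file):
//
//	func verifyBatchCRC(batch []byte) bool {
//		if len(batch) < 21 {
//			return false
//		}
//		stored := binary.BigEndian.Uint32(batch[17:21]) // CRC field (bytes 17-20)
//		computed := crc32.Checksum(batch[21:], crc32.MakeTable(crc32.Castagnoli))
//		return stored == computed
//	}
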
// CompressedBatchResult represents a compressed record batch result
type CompressedBatchResult struct {
	CompressedData []byte
	OriginalSize   int32
	CompressedSize int32
	Codec          compression.CompressionCodec
}

// CreateCompressedBatch creates a compressed record batch (basic support)
func (f *MultiBatchFetcher) CreateCompressedBatch(baseOffset int64, smqRecords []integration.SMQRecord, codec compression.CompressionCodec) (*CompressedBatchResult, error) {
	if codec == compression.None {
		// No compression requested
		batch := f.constructSingleRecordBatch("", baseOffset, smqRecords)
		return &CompressedBatchResult{
			CompressedData: batch,
			OriginalSize:   int32(len(batch)),
			CompressedSize: int32(len(batch)),
			Codec:          compression.None,
		}, nil
	}

	// For Phase 5, implement basic GZIP compression support
	originalBatch := f.constructSingleRecordBatch("", baseOffset, smqRecords)
	originalSize := int32(len(originalBatch))

	compressedData, err := f.compressData(originalBatch, codec)
	if err != nil {
		// Fall back to uncompressed if compression fails
		return &CompressedBatchResult{
			CompressedData: originalBatch,
			OriginalSize:   originalSize,
			CompressedSize: originalSize,
			Codec:          compression.None,
		}, nil
	}

	// Create a compressed record batch with proper headers
	compressedBatch := f.constructCompressedRecordBatch(baseOffset, compressedData, codec, originalSize)

	return &CompressedBatchResult{
		CompressedData: compressedBatch,
		OriginalSize:   originalSize,
		CompressedSize: int32(len(compressedBatch)),
		Codec:          codec,
	}, nil
}

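// Illustrative use of CreateCompressedBatch (hypothetical caller; fetcher
// and records are assumptions, not names from this file):
//
//	res, err := fetcher.CreateCompressedBatch(baseOffset, records, compression.Gzip)
//	if err == nil && res.Codec != compression.None {
//		glog.V(4).Infof("compressed batch %d -> %d bytes", res.OriginalSize, res.CompressedSize)
//	}
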
// constructCompressedRecordBatch creates a record batch with compressed records
func (f *MultiBatchFetcher) constructCompressedRecordBatch(baseOffset int64, compressedRecords []byte, codec compression.CompressionCodec, originalSize int32) []byte {
	// Validate size to prevent overflow
	const maxBatchSize = 1 << 30 // 1 GB limit
	if len(compressedRecords) > maxBatchSize-100 {
		glog.Errorf("Compressed records too large: %d bytes", len(compressedRecords))
		return nil
	}
	batch := make([]byte, 0, len(compressedRecords)+100)

	// The record batch header mirrors a regular batch
	baseOffsetBytes := make([]byte, 8)
	binary.BigEndian.PutUint64(baseOffsetBytes, uint64(baseOffset))
	batch = append(batch, baseOffsetBytes...)

	// Batch length (4 bytes) - filled in later
	batchLengthPos := len(batch)
	batch = append(batch, 0, 0, 0, 0)

	// Partition leader epoch (4 bytes) - -1
	batch = append(batch, 0xFF, 0xFF, 0xFF, 0xFF)

	// Magic byte (1 byte) - v2 format
	batch = append(batch, 2)

	// CRC placeholder (4 bytes)
	crcPos := len(batch)
	batch = append(batch, 0, 0, 0, 0)

	// Attributes (2 bytes) - set the compression codec in the lower bits
	var compressionBits uint16
	switch codec {
	case compression.Gzip:
		compressionBits = 1
	case compression.Snappy:
		compressionBits = 2
	case compression.Lz4:
		compressionBits = 3
	case compression.Zstd:
		compressionBits = 4
	default:
		compressionBits = 0 // no compression
	}
	batch = append(batch, byte(compressionBits>>8), byte(compressionBits))

	// Last offset delta (4 bytes) - should reflect the logical record count;
	// left at 0 here as a placeholder
	batch = append(batch, 0, 0, 0, 0)

	// Timestamps (16 bytes) - fixed placeholder value (same as empty batches)
	timestamp := uint64(1640995200000)
	timestampBytes := make([]byte, 8)
	binary.BigEndian.PutUint64(timestampBytes, timestamp)
	batch = append(batch, timestampBytes...) // first timestamp
	batch = append(batch, timestampBytes...) // max timestamp

	// Producer fields (14 bytes total)
	batch = append(batch, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF, 0xFF) // producer ID
	batch = append(batch, 0xFF, 0xFF)                                     // producer epoch
	batch = append(batch, 0xFF, 0xFF, 0xFF, 0xFF)                         // base sequence

	// Record count (4 bytes) - the number of logical records; placeholder of 1
	batch = append(batch, 0, 0, 0, 1)

	// Compressed records data
	batch = append(batch, compressedRecords...)

	// Fill in the batch length
	batchLength := uint32(len(batch) - batchLengthPos - 4)
	binary.BigEndian.PutUint32(batch[batchLengthPos:batchLengthPos+4], batchLength)

	// Calculate CRC32 for the batch.
	// Per the Kafka spec, the CRC covers ONLY from the attributes offset (byte 21) onwards;
	// see DefaultRecordBatch.java computeChecksum() - Crc32C.compute(buffer, ATTRIBUTES_OFFSET, ...)
	crcData := batch[crcPos+4:] // Skip the CRC field itself, include the rest
	crc := crc32.Checksum(crcData, crc32.MakeTable(crc32.Castagnoli))
	binary.BigEndian.PutUint32(batch[crcPos:crcPos+4], crc)

	return batch
}

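// For reference (Kafka v2 record batch attributes, not specific to this
// file): bits 0-2 carry the compression codec (0=none, 1=gzip, 2=snappy,
// 3=lz4, 4=zstd), bit 3 the timestamp type (0 = CreateTime), bit 4 whether
// the batch is transactional, and bit 5 whether it is a control batch.
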
// compressData compresses data using the specified codec (basic implementation)
func (f *MultiBatchFetcher) compressData(data []byte, codec compression.CompressionCodec) ([]byte, error) {
	// For Phase 5, implement basic compression support
	switch codec {
	case compression.None:
		return data, nil
	case compression.Gzip:
		// Implement actual GZIP compression
		var buf bytes.Buffer
		gzipWriter := gzip.NewWriter(&buf)

		if _, err := gzipWriter.Write(data); err != nil {
			gzipWriter.Close()
			return nil, fmt.Errorf("gzip compression write failed: %w", err)
		}

		if err := gzipWriter.Close(); err != nil {
			return nil, fmt.Errorf("gzip compression close failed: %w", err)
		}

		return buf.Bytes(), nil
	default:
		return nil, fmt.Errorf("unsupported compression codec: %d", codec)
	}
}
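
// A minimal round-trip check for compressData, for reference (illustrative
// sketch, not part of the fetch path; gunzipData is a hypothetical helper
// and needs "io" in addition to this file's imports):
//
//	func gunzipData(data []byte) ([]byte, error) {
//		r, err := gzip.NewReader(bytes.NewReader(data))
//		if err != nil {
//			return nil, err
//		}
//		defer r.Close()
//		return io.ReadAll(r)
//	}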