
clean up

Branch: pull/7481/head
Commit: d9cbc07b2a by chrislu, 2 weeks ago
Changed files:
  1. weed/s3api/s3api_object_handlers.go (195 changed lines)
  2. weed/s3api/s3api_object_handlers_put.go (59 changed lines)
  3. weed/s3api/s3api_object_handlers_test.go (72 changed lines)

weed/s3api/s3api_object_handlers.go (195 changed lines)

@@ -25,8 +25,8 @@ import (
"github.com/seaweedfs/seaweedfs/weed/s3api/s3_constants"
"github.com/seaweedfs/seaweedfs/weed/s3api/s3err"
"github.com/seaweedfs/seaweedfs/weed/util/mem"
util_http "github.com/seaweedfs/seaweedfs/weed/util/http"
"github.com/seaweedfs/seaweedfs/weed/util/mem"
"github.com/seaweedfs/seaweedfs/weed/glog"
)
@@ -46,6 +46,81 @@ var corsHeaders = []string{
// Package-level to avoid per-call allocations in writeZeroBytes
var zeroBuf = make([]byte, 32*1024)
+// adjustRangeForPart adjusts a client's Range header to absolute offsets within a part.
+// Parameters:
+//   - partStartOffset: the absolute start offset of the part in the object
+//   - partEndOffset: the absolute end offset of the part in the object
+//   - clientRangeHeader: the Range header value from the client (e.g., "bytes=0-99")
+//
+// Returns:
+//   - adjustedStart: the adjusted absolute start offset
+//   - adjustedEnd: the adjusted absolute end offset
+//   - error: nil on success, error if the range is invalid
+func adjustRangeForPart(partStartOffset, partEndOffset int64, clientRangeHeader string) (adjustedStart, adjustedEnd int64, err error) {
+	// If no range header, return the full part
+	if clientRangeHeader == "" || !strings.HasPrefix(clientRangeHeader, "bytes=") {
+		return partStartOffset, partEndOffset, nil
+	}
+	// Parse client's range request (relative to the part)
+	rangeSpec := clientRangeHeader[6:] // Remove "bytes=" prefix
+	parts := strings.Split(rangeSpec, "-")
+	if len(parts) != 2 {
+		return 0, 0, fmt.Errorf("invalid range format")
+	}
+	partSize := partEndOffset - partStartOffset + 1
+	var clientStart, clientEnd int64
+	// Parse start offset
+	if parts[0] != "" {
+		clientStart, err = strconv.ParseInt(parts[0], 10, 64)
+		if err != nil {
+			return 0, 0, fmt.Errorf("invalid range start: %w", err)
+		}
+	}
+	// Parse end offset
+	if parts[1] != "" {
+		clientEnd, err = strconv.ParseInt(parts[1], 10, 64)
+		if err != nil {
+			return 0, 0, fmt.Errorf("invalid range end: %w", err)
+		}
+	} else {
+		// No end specified, read to end of part
+		clientEnd = partSize - 1
+	}
+	// Handle suffix-range (e.g., "bytes=-100" means last 100 bytes)
+	if parts[0] == "" {
+		// suffix-range: clientEnd is actually the suffix length
+		suffixLength := clientEnd
+		if suffixLength > partSize {
+			suffixLength = partSize
+		}
+		clientStart = partSize - suffixLength
+		clientEnd = partSize - 1
+	}
+	// Validate range is within part boundaries
+	if clientStart < 0 || clientStart >= partSize {
+		return 0, 0, fmt.Errorf("range start %d out of bounds for part size %d", clientStart, partSize)
+	}
+	if clientEnd >= partSize {
+		clientEnd = partSize - 1
+	}
+	if clientStart > clientEnd {
+		return 0, 0, fmt.Errorf("range start %d > end %d", clientStart, clientEnd)
+	}
+	// Adjust to absolute offsets in the object
+	adjustedStart = partStartOffset + clientStart
+	adjustedEnd = partStartOffset + clientEnd
+	return adjustedStart, adjustedEnd, nil
+}
// StreamError is returned when streaming functions encounter errors.
// It tracks whether an HTTP response has already been written to prevent
// double WriteHeader calls that would create malformed S3 error responses.
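For illustration, a minimal usage sketch of the new helper (example values invented, not from this commit; assumes it runs inside the s3api package with "fmt" imported):

// Hypothetical demo of adjustRangeForPart, not part of the commit.
func demoAdjustRangeForPart() {
	// Suppose part 2 of an object occupies absolute bytes 5000-9999 (partSize = 5000).
	start, end, _ := adjustRangeForPart(5000, 9999, "bytes=0-99")
	fmt.Println(start, end) // 5000 5099: the part-relative range is shifted by the part's start

	start, end, _ = adjustRangeForPart(5000, 9999, "bytes=-100")
	fmt.Println(start, end) // 9900 9999: a suffix range selects the last 100 bytes of the part

	start, end, _ = adjustRangeForPart(5000, 9999, "bytes=4500-")
	fmt.Println(start, end) // 9500 9999: an open-ended range runs to the end of the part
}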
@@ -620,72 +695,16 @@ func (s3a *S3ApiServer) GetObjectHandler(w http.ResponseWriter, r *http.Request)
// Check if client supplied a Range header - if so, apply it within the part's boundaries
// S3 allows both partNumber and Range together, where Range applies within the selected part
clientRangeHeader := r.Header.Get("Range")
if clientRangeHeader != "" && strings.HasPrefix(clientRangeHeader, "bytes=") {
// Parse client's range request (relative to the part)
rangeSpec := clientRangeHeader[6:] // Remove "bytes=" prefix
parts := strings.Split(rangeSpec, "-")
if len(parts) == 2 {
partSize := endOffset - startOffset + 1
var clientStart, clientEnd int64
var parseErr error
// Parse start offset
if parts[0] != "" {
clientStart, parseErr = strconv.ParseInt(parts[0], 10, 64)
if parseErr != nil {
glog.Warningf("GetObject: Invalid Range start for part %d: %s", partNumber, parts[0])
s3err.WriteErrorResponse(w, r, s3err.ErrInvalidRange)
return
}
}
// Parse end offset
if parts[1] != "" {
clientEnd, parseErr = strconv.ParseInt(parts[1], 10, 64)
if parseErr != nil {
glog.Warningf("GetObject: Invalid Range end for part %d: %s", partNumber, parts[1])
s3err.WriteErrorResponse(w, r, s3err.ErrInvalidRange)
return
}
} else {
// No end specified, read to end of part
clientEnd = partSize - 1
}
// Handle suffix-range (e.g., "bytes=-100" means last 100 bytes)
if parts[0] == "" {
// suffix-range: clientEnd is actually the suffix length
suffixLength := clientEnd
if suffixLength > partSize {
suffixLength = partSize
}
clientStart = partSize - suffixLength
clientEnd = partSize - 1
}
// Validate range is within part boundaries
if clientStart < 0 || clientStart >= partSize {
glog.Warningf("GetObject: Range start %d out of bounds for part %d (size: %d)", clientStart, partNumber, partSize)
s3err.WriteErrorResponse(w, r, s3err.ErrInvalidRange)
return
}
if clientEnd >= partSize {
clientEnd = partSize - 1
}
if clientStart > clientEnd {
glog.Warningf("GetObject: Invalid Range: start %d > end %d for part %d", clientStart, clientEnd, partNumber)
s3err.WriteErrorResponse(w, r, s3err.ErrInvalidRange)
return
}
// Adjust to absolute offsets in the object
partStartOffset := startOffset
startOffset = partStartOffset + clientStart
endOffset = partStartOffset + clientEnd
glog.V(3).Infof("GetObject: Client Range %s applied to part %d, adjusted to bytes=%d-%d", clientRangeHeader, partNumber, startOffset, endOffset)
if clientRangeHeader != "" {
adjustedStart, adjustedEnd, rangeErr := adjustRangeForPart(startOffset, endOffset, clientRangeHeader)
if rangeErr != nil {
glog.Warningf("GetObject: Invalid Range for part %d: %v", partNumber, rangeErr)
s3err.WriteErrorResponse(w, r, s3err.ErrInvalidRange)
return
}
startOffset = adjustedStart
endOffset = adjustedEnd
glog.V(3).Infof("GetObject: Client Range %s applied to part %d, adjusted to bytes=%d-%d", clientRangeHeader, partNumber, startOffset, endOffset)
}
// Set Range header to read the requested bytes (full part or client-specified range within part)
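To make the semantics concrete, here is a hypothetical client request that exercises this path (endpoint and object names invented; assumes "net/http" imported). S3 permits partNumber and Range together, with the Range interpreted within the selected part:

// Hypothetical request: the first 100 bytes of part 2 of bucket/key.
req, _ := http.NewRequest(http.MethodGet,
	"https://s3.example.com/bucket/key?partNumber=2", nil)
req.Header.Set("Range", "bytes=0-99")
// The handler resolves part 2's absolute offsets, then adjustRangeForPart
// shifts bytes=0-99 into that window before reading from the filer.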
@@ -1463,14 +1482,14 @@ func writeZeroBytes(w io.Writer, n int64) error {
// SSE-C multipart encryption (see lines 2772-2781) differs fundamentally from SSE-KMS/SSE-S3:
//
// 1. Encryption: CreateSSECEncryptedReader generates a RANDOM IV per part/chunk
-// - Each part starts with a fresh random IV
-// - CTR counter starts from 0 for each part: counter₀, counter₁, counter₂, ...
-// - PartOffset is stored in metadata but NOT applied during encryption
+//   - Each part starts with a fresh random IV
+//   - CTR counter starts from 0 for each part: counter₀, counter₁, counter₂, ...
+//   - PartOffset is stored in metadata but NOT applied during encryption
//
// 2. Decryption: Use the stored IV directly WITHOUT offset adjustment
-// - The stored IV already represents the start of this part's encryption
-// - Applying calculateIVWithOffset would shift to counterₙ, misaligning the keystream
-// - Result: XOR with wrong keystream = corrupted plaintext
+//   - The stored IV already represents the start of this part's encryption
+//   - Applying calculateIVWithOffset would shift to counterₙ, misaligning the keystream
+//   - Result: XOR with wrong keystream = corrupted plaintext
//
// This contrasts with SSE-KMS/SSE-S3 which use: base IV + calculateIVWithOffset(ChunkOffset)
func (s3a *S3ApiServer) decryptSSECChunkView(ctx context.Context, fileChunk *filer_pb.FileChunk, chunkView *filer.ChunkView, customerKey *SSECustomerKey) (io.Reader, error) {
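A rough sketch of the SSE-C read path described above, using only the standard library (a hypothetical helper, not SeaweedFS's actual decryptSSECChunkView; assumes "crypto/aes", "crypto/cipher", and "io" imported):

// Sketch: SSE-C decryption uses the part's stored random IV as-is.
func decryptPartSSEC(ciphertext io.Reader, customerKey, storedIV []byte) (io.Reader, error) {
	block, err := aes.NewCipher(customerKey) // customer-provided AES-256 key
	if err != nil {
		return nil, err
	}
	// The CTR keystream starts at counter 0 for this part, exactly mirroring
	// how encryption began with this fresh random IV; no offset adjustment.
	stream := cipher.NewCTR(block, storedIV)
	return &cipher.StreamReader{S: stream, R: ciphertext}, nil
}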
@@ -1534,15 +1553,15 @@ func (s3a *S3ApiServer) decryptSSECChunkView(ctx context.Context, fileChunk *fil
// SSE-KMS (and SSE-S3) use a fundamentally different IV scheme than SSE-C:
//
// 1. Encryption: Uses a BASE IV + offset calculation
-// - Base IV is generated once for the entire object
-// - For each chunk at position N: adjustedIV = calculateIVWithOffset(baseIV, N)
-// - This shifts the CTR counter to counterₙ where n = N/16
-// - ChunkOffset is stored in metadata and IS applied during encryption
+//   - Base IV is generated once for the entire object
+//   - For each chunk at position N: adjustedIV = calculateIVWithOffset(baseIV, N)
+//   - This shifts the CTR counter to counterₙ where n = N/16
+//   - ChunkOffset is stored in metadata and IS applied during encryption
//
// 2. Decryption: Apply the same offset calculation
-// - Use calculateIVWithOffset(baseIV, ChunkOffset) to reconstruct the encryption IV
-// - Also handle ivSkip for non-block-aligned offsets (intra-block positioning)
-// - This ensures decryption uses the same CTR counter sequence as encryption
+//   - Use calculateIVWithOffset(baseIV, ChunkOffset) to reconstruct the encryption IV
+//   - Also handle ivSkip for non-block-aligned offsets (intra-block positioning)
+//   - This ensures decryption uses the same CTR counter sequence as encryption
//
// This contrasts with SSE-C which uses random IVs without offset calculation.
func (s3a *S3ApiServer) decryptSSEKMSChunkView(ctx context.Context, fileChunk *filer_pb.FileChunk, chunkView *filer.ChunkView) (io.Reader, error) {
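The base-IV-plus-offset arithmetic referenced here can be sketched as follows (hypothetical code illustrating the idea, not SeaweedFS's calculateIVWithOffset, which may differ in detail):

// Sketch: derive the CTR IV for data at byte position `offset` from the
// object's base IV. AES-CTR advances the counter once per 16-byte block, so
// a byte offset N adds N/16 to the big-endian counter in the IV; the N%16
// remainder is keystream to skip within the first block (the "ivSkip" above).
func ivWithOffset(baseIV []byte, offset int64) (adjustedIV []byte, skip int64) {
	adjustedIV = make([]byte, len(baseIV))
	copy(adjustedIV, baseIV)
	carry := uint64(offset / 16)
	for i := len(adjustedIV) - 1; i >= 0 && carry > 0; i-- {
		sum := uint64(adjustedIV[i]) + (carry & 0xff) // add low byte, propagate carry
		adjustedIV[i] = byte(sum)
		carry = (carry >> 8) + (sum >> 8)
	}
	return adjustedIV, offset % 16
}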
@@ -1622,19 +1641,19 @@ func (s3a *S3ApiServer) decryptSSEKMSChunkView(ctx context.Context, fileChunk *f
// SSE-S3 uses the same BASE IV + offset scheme as SSE-KMS, but with a subtle difference:
//
// 1. Encryption: Uses BASE IV + offset, but stores the ADJUSTED IV
-// - Base IV is generated once for the entire object
-// - For each chunk at position N: adjustedIV, skip = calculateIVWithOffset(baseIV, N)
-// - The ADJUSTED IV (not base IV) is stored in chunk metadata
-// - ChunkOffset calculation is performed during encryption
+//   - Base IV is generated once for the entire object
+//   - For each chunk at position N: adjustedIV, skip = calculateIVWithOffset(baseIV, N)
+//   - The ADJUSTED IV (not base IV) is stored in chunk metadata
+//   - ChunkOffset calculation is performed during encryption
//
// 2. Decryption: Use the stored adjusted IV directly
-// - The stored IV is already block-aligned and ready to use
-// - No need to call calculateIVWithOffset again (unlike SSE-KMS)
-// - Decrypt full chunk from start, then skip to OffsetInChunk in plaintext
+//   - The stored IV is already block-aligned and ready to use
+//   - No need to call calculateIVWithOffset again (unlike SSE-KMS)
+//   - Decrypt full chunk from start, then skip to OffsetInChunk in plaintext
//
// This differs from:
-// - SSE-C: Uses random IV per chunk, no offset calculation
-// - SSE-KMS: Stores base IV, requires calculateIVWithOffset during decryption
+//   - SSE-C: Uses random IV per chunk, no offset calculation
+//   - SSE-KMS: Stores base IV, requires calculateIVWithOffset during decryption
func (s3a *S3ApiServer) decryptSSES3ChunkView(ctx context.Context, fileChunk *filer_pb.FileChunk, chunkView *filer.ChunkView, entry *filer_pb.Entry) (io.Reader, error) {
// For multipart SSE-S3, each chunk has its own IV in chunk.SseMetadata
if fileChunk.GetSseType() == filer_pb.SSEType_SSE_S3 && len(fileChunk.GetSseMetadata()) > 0 {
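Correspondingly, a sketch of the SSE-S3 read path described in the comment above (a hypothetical helper under the same assumptions as the SSE-C sketch, not the actual decryptSSES3ChunkView): the stored, already-adjusted IV is used directly, and the reader discards plaintext to reach the requested offset within the chunk.

// Sketch: SSE-S3 chunks store an offset-adjusted IV, so decryption starts
// the CTR stream from it directly, then skips plaintext to OffsetInChunk.
func decryptChunkSSES3(chunk io.Reader, objectKey, storedAdjustedIV []byte, offsetInChunk int64) (io.Reader, error) {
	block, err := aes.NewCipher(objectKey)
	if err != nil {
		return nil, err
	}
	plain := &cipher.StreamReader{S: cipher.NewCTR(block, storedAdjustedIV), R: chunk}
	// Skip to the requested position in the decrypted stream.
	if _, err := io.CopyN(io.Discard, plain, offsetInChunk); err != nil {
		return nil, err
	}
	return plain, nil
}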

weed/s3api/s3api_object_handlers_put.go (59 changed lines)

@@ -2,7 +2,6 @@ package s3api
import (
"context"
"crypto/md5"
"encoding/base64"
"encoding/json"
"errors"
@@ -680,15 +679,8 @@ func (s3a *S3ApiServer) putSuspendedVersioningObject(r *http.Request, bucket, ob
// Normalize object path to ensure consistency with toFilerUrl behavior
normalizedObject := removeDuplicateSlashes(object)
-// Enable detailed logging for testobjbar
-isTestObj := (normalizedObject == "testobjbar")
-glog.V(3).Infof("putSuspendedVersioningObject: START bucket=%s, object=%s, normalized=%s, isTestObj=%v",
-	bucket, object, normalizedObject, isTestObj)
-if isTestObj {
-	glog.V(3).Infof("=== TESTOBJBAR: putSuspendedVersioningObject START ===")
-}
+glog.V(3).Infof("putSuspendedVersioningObject: START bucket=%s, object=%s, normalized=%s",
+	bucket, object, normalizedObject)
bucketDir := s3a.option.BucketsPath + "/" + bucket
@@ -726,8 +718,7 @@ func (s3a *S3ApiServer) putSuspendedVersioningObject(r *http.Request, bucket, ob
uploadUrl := s3a.toFilerUrl(bucket, normalizedObject)
-hash := md5.New()
-var body = io.TeeReader(dataReader, hash)
+body := dataReader
if objectContentType == "" {
body = mimeDetect(r, body)
}
@@ -738,10 +729,6 @@ func (s3a *S3ApiServer) putSuspendedVersioningObject(r *http.Request, bucket, ob
// Set version ID to "null" for suspended versioning
r.Header.Set(s3_constants.ExtVersionIdKey, "null")
-if isTestObj {
-	glog.V(3).Infof("=== TESTOBJBAR: set version header before putToFiler, r.Header[%s]=%s ===",
-		s3_constants.ExtVersionIdKey, r.Header.Get(s3_constants.ExtVersionIdKey))
-}
// Extract and set object lock metadata as headers
// This handles retention mode, retention date, and legal hold
@@ -792,44 +779,11 @@ func (s3a *S3ApiServer) putSuspendedVersioningObject(r *http.Request, bucket, ob
}
// Upload the file using putToFiler - this will create the file with version metadata
-if isTestObj {
-	glog.V(3).Infof("=== TESTOBJBAR: calling putToFiler ===")
-}
etag, errCode, sseMetadata = s3a.putToFiler(r, uploadUrl, body, bucket, 1)
if errCode != s3err.ErrNone {
glog.Errorf("putSuspendedVersioningObject: failed to upload object: %v", errCode)
return "", errCode, SSEResponseMetadata{}
}
-if isTestObj {
-	glog.V(3).Infof("=== TESTOBJBAR: putToFiler completed, etag=%s ===", etag)
-}
-// Verify the metadata was set correctly during file creation
-if isTestObj {
-	// Read back the entry to verify
-	maxRetries := 3
-	for attempt := 1; attempt <= maxRetries; attempt++ {
-		verifyEntry, verifyErr := s3a.getEntry(bucketDir, normalizedObject)
-		if verifyErr == nil {
-			glog.V(3).Infof("=== TESTOBJBAR: verify attempt %d, entry.Extended=%v ===", attempt, verifyEntry.Extended)
-			if verifyEntry.Extended != nil {
-				if versionIdBytes, ok := verifyEntry.Extended[s3_constants.ExtVersionIdKey]; ok {
-					glog.V(3).Infof("=== TESTOBJBAR: verification SUCCESSFUL, version=%s ===", string(versionIdBytes))
-				} else {
-					glog.V(3).Infof("=== TESTOBJBAR: verification FAILED, ExtVersionIdKey not found ===")
-				}
-			} else {
-				glog.V(3).Infof("=== TESTOBJBAR: verification FAILED, Extended is nil ===")
-			}
-			break
-		} else {
-			glog.V(3).Infof("=== TESTOBJBAR: getEntry failed on attempt %d: %v ===", attempt, verifyErr)
-		}
-		if attempt < maxRetries {
-			time.Sleep(time.Millisecond * 10)
-		}
-	}
-}
// Update all existing versions/delete markers to set IsLatest=false since "null" is now latest
err = s3a.updateIsLatestFlagsForSuspendedVersioning(bucket, normalizedObject)
@@ -839,9 +793,7 @@ func (s3a *S3ApiServer) putSuspendedVersioningObject(r *http.Request, bucket, ob
}
glog.V(2).Infof("putSuspendedVersioningObject: successfully created null version for %s/%s", bucket, object)
-if isTestObj {
-	glog.V(3).Infof("=== TESTOBJBAR: putSuspendedVersioningObject COMPLETED ===")
-}
return etag, s3err.ErrNone, sseMetadata
}
@@ -942,8 +894,7 @@ func (s3a *S3ApiServer) putVersionedObject(r *http.Request, bucket, object strin
return "", "", s3err.ErrInternalError, SSEResponseMetadata{}
}
-hash := md5.New()
-var body = io.TeeReader(dataReader, hash)
+body := dataReader
if objectContentType == "" {
body = mimeDetect(r, body)
}

weed/s3api/s3api_object_handlers_test.go (72 changed lines)

@@ -1,8 +1,6 @@
package s3api
import (
"strconv"
"strings"
"testing"
"time"
@@ -245,75 +243,13 @@ func TestPartNumberWithRangeHeader(t *testing.T) {
for _, tt := range tests {
t.Run(tt.name, func(t *testing.T) {
-// Simulate the range adjustment logic from GetObjectHandler
-startOffset := tt.partStartOffset
-endOffset := tt.partEndOffset
-hasError := false
-if tt.clientRangeHeader != "" && strings.HasPrefix(tt.clientRangeHeader, "bytes=") {
-	rangeSpec := tt.clientRangeHeader[6:] // Remove "bytes=" prefix
-	parts := strings.Split(rangeSpec, "-")
-	if len(parts) == 2 {
-		partSize := endOffset - startOffset + 1
-		var clientStart, clientEnd int64
-		var parseErr error
-		// Parse start offset
-		if parts[0] != "" {
-			clientStart, parseErr = strconv.ParseInt(parts[0], 10, 64)
-			if parseErr != nil {
-				hasError = true
-			}
-		}
-		// Parse end offset
-		if parts[1] != "" {
-			clientEnd, parseErr = strconv.ParseInt(parts[1], 10, 64)
-			if parseErr != nil {
-				hasError = true
-			}
-		} else {
-			// No end specified, read to end of part
-			clientEnd = partSize - 1
-		}
-		// Handle suffix-range (e.g., "bytes=-100" means last 100 bytes)
-		if parts[0] == "" && !hasError {
-			// suffix-range: clientEnd is actually the suffix length
-			suffixLength := clientEnd
-			if suffixLength > partSize {
-				suffixLength = partSize
-			}
-			clientStart = partSize - suffixLength
-			clientEnd = partSize - 1
-		}
-		// Validate range is within part boundaries
-		if !hasError {
-			if clientStart < 0 || clientStart >= partSize {
-				hasError = true
-			} else if clientEnd >= partSize {
-				clientEnd = partSize - 1
-			}
-			if clientStart > clientEnd {
-				hasError = true
-			}
-			if !hasError {
-				// Adjust to absolute offsets in the object
-				partStartOffset := startOffset
-				startOffset = partStartOffset + clientStart
-				endOffset = partStartOffset + clientEnd
-			}
-		}
-	}
-}
+// Test the actual range adjustment logic from GetObjectHandler
+startOffset, endOffset, err := adjustRangeForPart(tt.partStartOffset, tt.partEndOffset, tt.clientRangeHeader)
if tt.expectError {
-assert.True(t, hasError, "Expected error for range %s", tt.clientRangeHeader)
+assert.Error(t, err, "Expected error for range %s", tt.clientRangeHeader)
} else {
-assert.False(t, hasError, "Unexpected error for range %s", tt.clientRangeHeader)
+assert.NoError(t, err, "Unexpected error for range %s: %v", tt.clientRangeHeader, err)
assert.Equal(t, tt.expectedStart, startOffset, "Start offset mismatch")
assert.Equal(t, tt.expectedEnd, endOffset, "End offset mismatch")
}
