|
|
@ -11,6 +11,7 @@ import ( |
|
|
"github.com/seaweedfs/seaweedfs/weed/storage/idx" |
|
|
"github.com/seaweedfs/seaweedfs/weed/storage/idx" |
|
|
"github.com/seaweedfs/seaweedfs/weed/storage/needle_map" |
|
|
"github.com/seaweedfs/seaweedfs/weed/storage/needle_map" |
|
|
"github.com/seaweedfs/seaweedfs/weed/storage/types" |
|
|
"github.com/seaweedfs/seaweedfs/weed/storage/types" |
|
|
|
|
|
"github.com/seaweedfs/seaweedfs/weed/storage/volume_info" |
|
|
"github.com/seaweedfs/seaweedfs/weed/util" |
|
|
"github.com/seaweedfs/seaweedfs/weed/util" |
|
|
) |
|
|
) |
|
|
|
|
|
|
|
|
@ -18,6 +19,7 @@ const ( |
|
|
DataShardsCount = 10 |
|
|
DataShardsCount = 10 |
|
|
ParityShardsCount = 4 |
|
|
ParityShardsCount = 4 |
|
|
TotalShardsCount = DataShardsCount + ParityShardsCount |
|
|
TotalShardsCount = DataShardsCount + ParityShardsCount |
|
|
|
|
|
MaxShardCount = 32 // Maximum number of shards since ShardBits is uint32 (bits 0-31)
|
|
|
MinTotalDisks = TotalShardsCount/ParityShardsCount + 1 |
|
|
MinTotalDisks = TotalShardsCount/ParityShardsCount + 1 |
|
|
ErasureCodingLargeBlockSize = 1024 * 1024 * 1024 // 1GB
|
|
|
ErasureCodingLargeBlockSize = 1024 * 1024 * 1024 // 1GB
|
|
|
ErasureCodingSmallBlockSize = 1024 * 1024 // 1MB
|
|
|
ErasureCodingSmallBlockSize = 1024 * 1024 // 1MB
|
|
|
@ -54,20 +56,53 @@ func WriteSortedFileFromIdx(baseFileName string, ext string) (e error) { |
|
|
return nil |
|
|
return nil |
|
|
} |
|
|
} |
|
|
|
|
|
|
|
|
// WriteEcFiles generates .ec00 ~ .ec13 files
|
|
|
|
|
|
|
|
|
// WriteEcFiles generates .ec00 ~ .ec13 files using default EC context
|
|
|
func WriteEcFiles(baseFileName string) error { |
|
|
func WriteEcFiles(baseFileName string) error { |
|
|
return generateEcFiles(baseFileName, 256*1024, ErasureCodingLargeBlockSize, ErasureCodingSmallBlockSize) |
|
|
|
|
|
|
|
|
ctx := NewDefaultECContext("", 0) |
|
|
|
|
|
return WriteEcFilesWithContext(baseFileName, ctx) |
|
|
|
|
|
} |
|
|
|
|
|
|
|
|
|
|
|
// WriteEcFilesWithContext generates EC files using the provided context
|
|
|
|
|
|
func WriteEcFilesWithContext(baseFileName string, ctx *ECContext) error { |
|
|
|
|
|
return generateEcFiles(baseFileName, 256*1024, ErasureCodingLargeBlockSize, ErasureCodingSmallBlockSize, ctx) |
|
|
} |
|
|
} |
|
|
|
|
|
|
|
|
func RebuildEcFiles(baseFileName string) ([]uint32, error) { |
|
|
func RebuildEcFiles(baseFileName string) ([]uint32, error) { |
|
|
return generateMissingEcFiles(baseFileName, 256*1024, ErasureCodingLargeBlockSize, ErasureCodingSmallBlockSize) |
|
|
|
|
|
|
|
|
// Attempt to load EC config from .vif file to preserve original configuration
|
|
|
|
|
|
var ctx *ECContext |
|
|
|
|
|
if volumeInfo, _, found, _ := volume_info.MaybeLoadVolumeInfo(baseFileName + ".vif"); found && volumeInfo.EcShardConfig != nil { |
|
|
|
|
|
ds := int(volumeInfo.EcShardConfig.DataShards) |
|
|
|
|
|
ps := int(volumeInfo.EcShardConfig.ParityShards) |
|
|
|
|
|
|
|
|
|
|
|
// Validate EC config before using it
|
|
|
|
|
|
if ds > 0 && ps > 0 && ds+ps <= MaxShardCount { |
|
|
|
|
|
ctx = &ECContext{ |
|
|
|
|
|
DataShards: ds, |
|
|
|
|
|
ParityShards: ps, |
|
|
|
|
|
} |
|
|
|
|
|
glog.V(0).Infof("Rebuilding EC files for %s with config from .vif: %s", baseFileName, ctx.String()) |
|
|
|
|
|
} else { |
|
|
|
|
|
glog.Warningf("Invalid EC config in .vif for %s (data=%d, parity=%d), using default", baseFileName, ds, ps) |
|
|
|
|
|
ctx = NewDefaultECContext("", 0) |
|
|
|
|
|
} |
|
|
|
|
|
} else { |
|
|
|
|
|
glog.V(0).Infof("Rebuilding EC files for %s with default config", baseFileName) |
|
|
|
|
|
ctx = NewDefaultECContext("", 0) |
|
|
|
|
|
} |
|
|
|
|
|
|
|
|
|
|
|
return RebuildEcFilesWithContext(baseFileName, ctx) |
|
|
|
|
|
} |
|
|
|
|
|
|
|
|
|
|
|
// RebuildEcFilesWithContext rebuilds missing EC files using the provided context
|
|
|
|
|
|
func RebuildEcFilesWithContext(baseFileName string, ctx *ECContext) ([]uint32, error) { |
|
|
|
|
|
return generateMissingEcFiles(baseFileName, 256*1024, ErasureCodingLargeBlockSize, ErasureCodingSmallBlockSize, ctx) |
|
|
} |
|
|
} |
|
|
|
|
|
|
|
|
func ToExt(ecIndex int) string { |
|
|
func ToExt(ecIndex int) string { |
|
|
return fmt.Sprintf(".ec%02d", ecIndex) |
|
|
return fmt.Sprintf(".ec%02d", ecIndex) |
|
|
} |
|
|
} |
|
|
|
|
|
|
|
|
func generateEcFiles(baseFileName string, bufferSize int, largeBlockSize int64, smallBlockSize int64) error { |
|
|
|
|
|
|
|
|
func generateEcFiles(baseFileName string, bufferSize int, largeBlockSize int64, smallBlockSize int64, ctx *ECContext) error { |
|
|
file, err := os.OpenFile(baseFileName+".dat", os.O_RDONLY, 0) |
|
|
file, err := os.OpenFile(baseFileName+".dat", os.O_RDONLY, 0) |
|
|
if err != nil { |
|
|
if err != nil { |
|
|
return fmt.Errorf("failed to open dat file: %w", err) |
|
|
return fmt.Errorf("failed to open dat file: %w", err) |
|
|
@ -79,21 +114,21 @@ func generateEcFiles(baseFileName string, bufferSize int, largeBlockSize int64, |
|
|
return fmt.Errorf("failed to stat dat file: %w", err) |
|
|
return fmt.Errorf("failed to stat dat file: %w", err) |
|
|
} |
|
|
} |
|
|
|
|
|
|
|
|
glog.V(0).Infof("encodeDatFile %s.dat size:%d", baseFileName, fi.Size()) |
|
|
|
|
|
err = encodeDatFile(fi.Size(), baseFileName, bufferSize, largeBlockSize, file, smallBlockSize) |
|
|
|
|
|
|
|
|
glog.V(0).Infof("encodeDatFile %s.dat size:%d with EC context %s", baseFileName, fi.Size(), ctx.String()) |
|
|
|
|
|
err = encodeDatFile(fi.Size(), baseFileName, bufferSize, largeBlockSize, file, smallBlockSize, ctx) |
|
|
if err != nil { |
|
|
if err != nil { |
|
|
return fmt.Errorf("encodeDatFile: %w", err) |
|
|
return fmt.Errorf("encodeDatFile: %w", err) |
|
|
} |
|
|
} |
|
|
return nil |
|
|
return nil |
|
|
} |
|
|
} |
|
|
|
|
|
|
|
|
func generateMissingEcFiles(baseFileName string, bufferSize int, largeBlockSize int64, smallBlockSize int64) (generatedShardIds []uint32, err error) { |
|
|
|
|
|
|
|
|
func generateMissingEcFiles(baseFileName string, bufferSize int, largeBlockSize int64, smallBlockSize int64, ctx *ECContext) (generatedShardIds []uint32, err error) { |
|
|
|
|
|
|
|
|
shardHasData := make([]bool, TotalShardsCount) |
|
|
|
|
|
inputFiles := make([]*os.File, TotalShardsCount) |
|
|
|
|
|
outputFiles := make([]*os.File, TotalShardsCount) |
|
|
|
|
|
for shardId := 0; shardId < TotalShardsCount; shardId++ { |
|
|
|
|
|
shardFileName := baseFileName + ToExt(shardId) |
|
|
|
|
|
|
|
|
shardHasData := make([]bool, ctx.Total()) |
|
|
|
|
|
inputFiles := make([]*os.File, ctx.Total()) |
|
|
|
|
|
outputFiles := make([]*os.File, ctx.Total()) |
|
|
|
|
|
for shardId := 0; shardId < ctx.Total(); shardId++ { |
|
|
|
|
|
shardFileName := baseFileName + ctx.ToExt(shardId) |
|
|
if util.FileExists(shardFileName) { |
|
|
if util.FileExists(shardFileName) { |
|
|
shardHasData[shardId] = true |
|
|
shardHasData[shardId] = true |
|
|
inputFiles[shardId], err = os.OpenFile(shardFileName, os.O_RDONLY, 0) |
|
|
inputFiles[shardId], err = os.OpenFile(shardFileName, os.O_RDONLY, 0) |
|
|
@ -111,14 +146,14 @@ func generateMissingEcFiles(baseFileName string, bufferSize int, largeBlockSize |
|
|
} |
|
|
} |
|
|
} |
|
|
} |
|
|
|
|
|
|
|
|
err = rebuildEcFiles(shardHasData, inputFiles, outputFiles) |
|
|
|
|
|
|
|
|
err = rebuildEcFiles(shardHasData, inputFiles, outputFiles, ctx) |
|
|
if err != nil { |
|
|
if err != nil { |
|
|
return nil, fmt.Errorf("rebuildEcFiles: %w", err) |
|
|
return nil, fmt.Errorf("rebuildEcFiles: %w", err) |
|
|
} |
|
|
} |
|
|
return |
|
|
return |
|
|
} |
|
|
} |
|
|
|
|
|
|
|
|
func encodeData(file *os.File, enc reedsolomon.Encoder, startOffset, blockSize int64, buffers [][]byte, outputs []*os.File) error { |
|
|
|
|
|
|
|
|
func encodeData(file *os.File, enc reedsolomon.Encoder, startOffset, blockSize int64, buffers [][]byte, outputs []*os.File, ctx *ECContext) error { |
|
|
|
|
|
|
|
|
bufferSize := int64(len(buffers[0])) |
|
|
bufferSize := int64(len(buffers[0])) |
|
|
if bufferSize == 0 { |
|
|
if bufferSize == 0 { |
|
|
@ -131,7 +166,7 @@ func encodeData(file *os.File, enc reedsolomon.Encoder, startOffset, blockSize i |
|
|
} |
|
|
} |
|
|
|
|
|
|
|
|
for b := int64(0); b < batchCount; b++ { |
|
|
for b := int64(0); b < batchCount; b++ { |
|
|
err := encodeDataOneBatch(file, enc, startOffset+b*bufferSize, blockSize, buffers, outputs) |
|
|
|
|
|
|
|
|
err := encodeDataOneBatch(file, enc, startOffset+b*bufferSize, blockSize, buffers, outputs, ctx) |
|
|
if err != nil { |
|
|
if err != nil { |
|
|
return err |
|
|
return err |
|
|
} |
|
|
} |
|
|
@ -140,9 +175,9 @@ func encodeData(file *os.File, enc reedsolomon.Encoder, startOffset, blockSize i |
|
|
return nil |
|
|
return nil |
|
|
} |
|
|
} |
|
|
|
|
|
|
|
|
func openEcFiles(baseFileName string, forRead bool) (files []*os.File, err error) { |
|
|
|
|
|
for i := 0; i < TotalShardsCount; i++ { |
|
|
|
|
|
fname := baseFileName + ToExt(i) |
|
|
|
|
|
|
|
|
func openEcFiles(baseFileName string, forRead bool, ctx *ECContext) (files []*os.File, err error) { |
|
|
|
|
|
for i := 0; i < ctx.Total(); i++ { |
|
|
|
|
|
fname := baseFileName + ctx.ToExt(i) |
|
|
openOption := os.O_TRUNC | os.O_CREATE | os.O_WRONLY |
|
|
openOption := os.O_TRUNC | os.O_CREATE | os.O_WRONLY |
|
|
if forRead { |
|
|
if forRead { |
|
|
openOption = os.O_RDONLY |
|
|
openOption = os.O_RDONLY |
|
|
@ -164,10 +199,10 @@ func closeEcFiles(files []*os.File) { |
|
|
} |
|
|
} |
|
|
} |
|
|
} |
|
|
|
|
|
|
|
|
func encodeDataOneBatch(file *os.File, enc reedsolomon.Encoder, startOffset, blockSize int64, buffers [][]byte, outputs []*os.File) error { |
|
|
|
|
|
|
|
|
func encodeDataOneBatch(file *os.File, enc reedsolomon.Encoder, startOffset, blockSize int64, buffers [][]byte, outputs []*os.File, ctx *ECContext) error { |
|
|
|
|
|
|
|
|
// read data into buffers
|
|
|
// read data into buffers
|
|
|
for i := 0; i < DataShardsCount; i++ { |
|
|
|
|
|
|
|
|
for i := 0; i < ctx.DataShards; i++ { |
|
|
n, err := file.ReadAt(buffers[i], startOffset+blockSize*int64(i)) |
|
|
n, err := file.ReadAt(buffers[i], startOffset+blockSize*int64(i)) |
|
|
if err != nil { |
|
|
if err != nil { |
|
|
if err != io.EOF { |
|
|
if err != io.EOF { |
|
|
@ -186,7 +221,7 @@ func encodeDataOneBatch(file *os.File, enc reedsolomon.Encoder, startOffset, blo |
|
|
return err |
|
|
return err |
|
|
} |
|
|
} |
|
|
|
|
|
|
|
|
for i := 0; i < TotalShardsCount; i++ { |
|
|
|
|
|
|
|
|
for i := 0; i < ctx.Total(); i++ { |
|
|
_, err := outputs[i].Write(buffers[i]) |
|
|
_, err := outputs[i].Write(buffers[i]) |
|
|
if err != nil { |
|
|
if err != nil { |
|
|
return err |
|
|
return err |
|
|
@ -196,53 +231,57 @@ func encodeDataOneBatch(file *os.File, enc reedsolomon.Encoder, startOffset, blo |
|
|
return nil |
|
|
return nil |
|
|
} |
|
|
} |
|
|
|
|
|
|
|
|
func encodeDatFile(remainingSize int64, baseFileName string, bufferSize int, largeBlockSize int64, file *os.File, smallBlockSize int64) error { |
|
|
|
|
|
|
|
|
func encodeDatFile(remainingSize int64, baseFileName string, bufferSize int, largeBlockSize int64, file *os.File, smallBlockSize int64, ctx *ECContext) error { |
|
|
|
|
|
|
|
|
var processedSize int64 |
|
|
var processedSize int64 |
|
|
|
|
|
|
|
|
enc, err := reedsolomon.New(DataShardsCount, ParityShardsCount) |
|
|
|
|
|
|
|
|
enc, err := ctx.CreateEncoder() |
|
|
if err != nil { |
|
|
if err != nil { |
|
|
return fmt.Errorf("failed to create encoder: %w", err) |
|
|
return fmt.Errorf("failed to create encoder: %w", err) |
|
|
} |
|
|
} |
|
|
|
|
|
|
|
|
buffers := make([][]byte, TotalShardsCount) |
|
|
|
|
|
|
|
|
buffers := make([][]byte, ctx.Total()) |
|
|
for i := range buffers { |
|
|
for i := range buffers { |
|
|
buffers[i] = make([]byte, bufferSize) |
|
|
buffers[i] = make([]byte, bufferSize) |
|
|
} |
|
|
} |
|
|
|
|
|
|
|
|
outputs, err := openEcFiles(baseFileName, false) |
|
|
|
|
|
|
|
|
outputs, err := openEcFiles(baseFileName, false, ctx) |
|
|
defer closeEcFiles(outputs) |
|
|
defer closeEcFiles(outputs) |
|
|
if err != nil { |
|
|
if err != nil { |
|
|
return fmt.Errorf("failed to open ec files %s: %v", baseFileName, err) |
|
|
return fmt.Errorf("failed to open ec files %s: %v", baseFileName, err) |
|
|
} |
|
|
} |
|
|
|
|
|
|
|
|
for remainingSize > largeBlockSize*DataShardsCount { |
|
|
|
|
|
err = encodeData(file, enc, processedSize, largeBlockSize, buffers, outputs) |
|
|
|
|
|
|
|
|
// Pre-calculate row sizes to avoid redundant calculations in loops
|
|
|
|
|
|
largeRowSize := largeBlockSize * int64(ctx.DataShards) |
|
|
|
|
|
smallRowSize := smallBlockSize * int64(ctx.DataShards) |
|
|
|
|
|
|
|
|
|
|
|
for remainingSize >= largeRowSize { |
|
|
|
|
|
err = encodeData(file, enc, processedSize, largeBlockSize, buffers, outputs, ctx) |
|
|
if err != nil { |
|
|
if err != nil { |
|
|
return fmt.Errorf("failed to encode large chunk data: %w", err) |
|
|
return fmt.Errorf("failed to encode large chunk data: %w", err) |
|
|
} |
|
|
} |
|
|
remainingSize -= largeBlockSize * DataShardsCount |
|
|
|
|
|
processedSize += largeBlockSize * DataShardsCount |
|
|
|
|
|
|
|
|
remainingSize -= largeRowSize |
|
|
|
|
|
processedSize += largeRowSize |
|
|
} |
|
|
} |
|
|
for remainingSize > 0 { |
|
|
for remainingSize > 0 { |
|
|
err = encodeData(file, enc, processedSize, smallBlockSize, buffers, outputs) |
|
|
|
|
|
|
|
|
err = encodeData(file, enc, processedSize, smallBlockSize, buffers, outputs, ctx) |
|
|
if err != nil { |
|
|
if err != nil { |
|
|
return fmt.Errorf("failed to encode small chunk data: %w", err) |
|
|
return fmt.Errorf("failed to encode small chunk data: %w", err) |
|
|
} |
|
|
} |
|
|
remainingSize -= smallBlockSize * DataShardsCount |
|
|
|
|
|
processedSize += smallBlockSize * DataShardsCount |
|
|
|
|
|
|
|
|
remainingSize -= smallRowSize |
|
|
|
|
|
processedSize += smallRowSize |
|
|
} |
|
|
} |
|
|
return nil |
|
|
return nil |
|
|
} |
|
|
} |
|
|
|
|
|
|
|
|
func rebuildEcFiles(shardHasData []bool, inputFiles []*os.File, outputFiles []*os.File) error { |
|
|
|
|
|
|
|
|
func rebuildEcFiles(shardHasData []bool, inputFiles []*os.File, outputFiles []*os.File, ctx *ECContext) error { |
|
|
|
|
|
|
|
|
enc, err := reedsolomon.New(DataShardsCount, ParityShardsCount) |
|
|
|
|
|
|
|
|
enc, err := ctx.CreateEncoder() |
|
|
if err != nil { |
|
|
if err != nil { |
|
|
return fmt.Errorf("failed to create encoder: %w", err) |
|
|
return fmt.Errorf("failed to create encoder: %w", err) |
|
|
} |
|
|
} |
|
|
|
|
|
|
|
|
buffers := make([][]byte, TotalShardsCount) |
|
|
|
|
|
|
|
|
buffers := make([][]byte, ctx.Total()) |
|
|
for i := range buffers { |
|
|
for i := range buffers { |
|
|
if shardHasData[i] { |
|
|
if shardHasData[i] { |
|
|
buffers[i] = make([]byte, ErasureCodingSmallBlockSize) |
|
|
buffers[i] = make([]byte, ErasureCodingSmallBlockSize) |
|
|
@ -254,7 +293,7 @@ func rebuildEcFiles(shardHasData []bool, inputFiles []*os.File, outputFiles []*o |
|
|
for { |
|
|
for { |
|
|
|
|
|
|
|
|
// read the input data from files
|
|
|
// read the input data from files
|
|
|
for i := 0; i < TotalShardsCount; i++ { |
|
|
|
|
|
|
|
|
for i := 0; i < ctx.Total(); i++ { |
|
|
if shardHasData[i] { |
|
|
if shardHasData[i] { |
|
|
n, _ := inputFiles[i].ReadAt(buffers[i], startOffset) |
|
|
n, _ := inputFiles[i].ReadAt(buffers[i], startOffset) |
|
|
if n == 0 { |
|
|
if n == 0 { |
|
|
@ -278,7 +317,7 @@ func rebuildEcFiles(shardHasData []bool, inputFiles []*os.File, outputFiles []*o |
|
|
} |
|
|
} |
|
|
|
|
|
|
|
|
// write the data to output files
|
|
|
// write the data to output files
|
|
|
for i := 0; i < TotalShardsCount; i++ { |
|
|
|
|
|
|
|
|
for i := 0; i < ctx.Total(); i++ { |
|
|
if !shardHasData[i] { |
|
|
if !shardHasData[i] { |
|
|
n, _ := outputFiles[i].WriteAt(buffers[i][:inputBufferDataSize], startOffset) |
|
|
n, _ := outputFiles[i].WriteAt(buffers[i][:inputBufferDataSize], startOffset) |
|
|
if inputBufferDataSize != n { |
|
|
if inputBufferDataSize != n { |
|
|
|