You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

202 lines
5.5 KiB

  1. package erasure_coding
  2. import (
  3. "fmt"
  4. "io"
  5. "os"
  6. "github.com/chrislusf/seaweedfs/weed/glog"
  7. "github.com/chrislusf/seaweedfs/weed/storage/idx"
  8. "github.com/chrislusf/seaweedfs/weed/storage/needle_map"
  9. "github.com/chrislusf/seaweedfs/weed/storage/types"
  10. "github.com/klauspost/reedsolomon"
  11. )
  // Erasure coding layout parameters shared by the encoder in this file.
  const (
  	// DataShardsCount is the number of data shards handed to the
  	// Reed-Solomon encoder.
  	DataShardsCount = 10
  	// ParityShardsCount is the number of parity shards handed to the
  	// Reed-Solomon encoder.
  	ParityShardsCount = 4
  	// ErasureCodingLargeBlockSize is the per-shard block size used by
  	// WriteEcFiles for the large-block pass (1GB).
  	ErasureCodingLargeBlockSize = 1 << 30
  	// ErasureCodingSmallBlockSize is the per-shard block size used by
  	// WriteEcFiles for the small-block pass (1MB).
  	ErasureCodingSmallBlockSize = 1 << 20
  )
  18. // WriteSortedEcxFile generates .ecx file from existing .idx file
  19. // all keys are sorted in ascending order
  20. func WriteSortedEcxFile(baseFileName string) (e error) {
  21. cm, err := readCompactMap(baseFileName)
  22. if err != nil {
  23. return fmt.Errorf("readCompactMap: %v", err)
  24. }
  25. ecxFile, err := os.OpenFile(baseFileName+".ecx", os.O_TRUNC|os.O_CREATE|os.O_WRONLY, 0644)
  26. if err != nil {
  27. return fmt.Errorf("failed to open dat file: %v", err)
  28. }
  29. defer ecxFile.Close()
  30. err = cm.AscendingVisit(func(value needle_map.NeedleValue) error {
  31. bytes := value.ToBytes()
  32. _, writeErr := ecxFile.Write(bytes)
  33. return writeErr
  34. })
  35. if err != nil {
  36. return fmt.Errorf("failed to open dat file: %v", err)
  37. }
  38. return nil
  39. }
  40. // WriteEcFiles generates .ec01 ~ .ec14 files
  41. func WriteEcFiles(baseFileName string) error {
  42. return generateEcFiles(baseFileName, 256*1024, ErasureCodingLargeBlockSize, ErasureCodingSmallBlockSize)
  43. }
  // ToExt returns the shard file extension for ecIndex: ".ec" followed by
  // the index zero-padded to at least two digits, e.g. ToExt(1) == ".ec01".
  func ToExt(ecIndex int) string {
  	suffix := fmt.Sprintf("%02d", ecIndex)
  	return ".ec" + suffix
  }
  47. func generateEcFiles(baseFileName string, bufferSize int, largeBlockSize int64, smallBlockSize int64) error {
  48. file, err := os.OpenFile(baseFileName+".dat", os.O_RDONLY, 0)
  49. if err != nil {
  50. return fmt.Errorf("failed to open dat file: %v", err)
  51. }
  52. defer file.Close()
  53. fi, err := file.Stat()
  54. if err != nil {
  55. return fmt.Errorf("failed to stat dat file: %v", err)
  56. }
  57. err = encodeDatFile(fi.Size(), err, baseFileName, bufferSize, largeBlockSize, file, smallBlockSize)
  58. if err != nil {
  59. return fmt.Errorf("encodeDatFile: %v", err)
  60. }
  61. return nil
  62. }
  63. func encodeData(file *os.File, enc reedsolomon.Encoder, startOffset, blockSize int64, buffers [][]byte, outputs []*os.File) error {
  64. bufferSize := int64(len(buffers[0]))
  65. batchCount := blockSize / bufferSize
  66. if blockSize%bufferSize != 0 {
  67. glog.Fatalf("unexpected block size %d buffer size %d", blockSize, bufferSize)
  68. }
  69. for b := int64(0); b < batchCount; b++ {
  70. err := encodeDataOneBatch(file, enc, startOffset+b*bufferSize, blockSize, buffers, outputs)
  71. if err != nil {
  72. return err
  73. }
  74. }
  75. return nil
  76. }
  77. func openEcFiles(baseFileName string, forRead bool) (files []*os.File, err error) {
  78. for i := 0; i < DataShardsCount+ParityShardsCount; i++ {
  79. fname := baseFileName + ToExt(i+1)
  80. openOption := os.O_TRUNC | os.O_CREATE | os.O_WRONLY
  81. if forRead {
  82. openOption = os.O_RDONLY
  83. }
  84. f, err := os.OpenFile(fname, openOption, 0644)
  85. if err != nil {
  86. return files, fmt.Errorf("failed to open file %s: %v", fname, err)
  87. }
  88. files = append(files, f)
  89. }
  90. return
  91. }
  // closeEcFiles closes every non-nil file in files. Close errors are
  // ignored, and nil entries are skipped.
  func closeEcFiles(files []*os.File) {
  	for i := range files {
  		if files[i] == nil {
  			continue
  		}
  		files[i].Close()
  	}
  }
  99. func encodeDataOneBatch(file *os.File, enc reedsolomon.Encoder, startOffset, blockSize int64, buffers [][]byte, outputs []*os.File) error {
  100. // read data into buffers
  101. for i := 0; i < DataShardsCount; i++ {
  102. n, err := file.ReadAt(buffers[i], startOffset+blockSize*int64(i))
  103. if err != nil {
  104. if err != io.EOF {
  105. return err
  106. }
  107. }
  108. if n < len(buffers[i]) {
  109. for t := len(buffers[i]) - 1; t >= n; t-- {
  110. buffers[i][t] = 0
  111. }
  112. }
  113. }
  114. err := enc.Encode(buffers)
  115. if err != nil {
  116. return err
  117. }
  118. for i := 0; i < DataShardsCount+ParityShardsCount; i++ {
  119. _, err := outputs[i].Write(buffers[i])
  120. if err != nil {
  121. return err
  122. }
  123. }
  124. return nil
  125. }
  126. func encodeDatFile(remainingSize int64, err error, baseFileName string, bufferSize int, largeBlockSize int64, file *os.File, smallBlockSize int64) error {
  127. var processedSize int64
  128. enc, err := reedsolomon.New(DataShardsCount, ParityShardsCount)
  129. if err != nil {
  130. return fmt.Errorf("failed to create encoder: %v", err)
  131. }
  132. buffers := make([][]byte, DataShardsCount+ParityShardsCount)
  133. outputs, err := openEcFiles(baseFileName, false)
  134. defer closeEcFiles(outputs)
  135. if err != nil {
  136. return fmt.Errorf("failed to open dat file: %v", err)
  137. }
  138. for i, _ := range buffers {
  139. buffers[i] = make([]byte, bufferSize)
  140. }
  141. for remainingSize > largeBlockSize*DataShardsCount {
  142. err = encodeData(file, enc, processedSize, largeBlockSize, buffers, outputs)
  143. if err != nil {
  144. return fmt.Errorf("failed to encode large chunk data: %v", err)
  145. }
  146. remainingSize -= largeBlockSize * DataShardsCount
  147. processedSize += largeBlockSize * DataShardsCount
  148. }
  149. for remainingSize > 0 {
  150. encodeData(file, enc, processedSize, smallBlockSize, buffers, outputs)
  151. if err != nil {
  152. return fmt.Errorf("failed to encode small chunk data: %v", err)
  153. }
  154. remainingSize -= smallBlockSize * DataShardsCount
  155. processedSize += smallBlockSize * DataShardsCount
  156. }
  157. return nil
  158. }
  159. func readCompactMap(baseFileName string) (*needle_map.CompactMap, error) {
  160. indexFile, err := os.OpenFile(baseFileName+".idx", os.O_RDONLY, 0644)
  161. if err != nil {
  162. return nil, fmt.Errorf("cannot read Volume Index %s.idx: %v", baseFileName, err)
  163. }
  164. defer indexFile.Close()
  165. cm := needle_map.NewCompactMap()
  166. err = idx.WalkIndexFile(indexFile, func(key types.NeedleId, offset types.Offset, size uint32) error {
  167. if !offset.IsZero() && size != types.TombstoneFileSize {
  168. cm.Set(key, offset, size)
  169. } else {
  170. cm.Delete(key)
  171. }
  172. return nil
  173. })
  174. return cm, err
  175. }