You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

214 lines
5.5 KiB

6 years ago
6 years ago
6 years ago
  1. package erasure_coding
  2. import (
  3. "bytes"
  4. "fmt"
  5. "math/rand"
  6. "os"
  7. "testing"
  8. "github.com/chrislusf/seaweedfs/weed/storage/needle_map"
  9. "github.com/chrislusf/seaweedfs/weed/storage/types"
  10. "github.com/klauspost/reedsolomon"
  11. )
  12. const (
  13. largeBlockSize = 10000
  14. smallBlockSize = 100
  15. )
  16. func TestEncodingDecoding(t *testing.T) {
  17. bufferSize := 50
  18. baseFileName := "1"
  19. err := generateEcFiles(baseFileName, bufferSize, largeBlockSize, smallBlockSize)
  20. if err != nil {
  21. t.Logf("generateEcFiles: %v", err)
  22. }
  23. err = WriteSortedEcxFile(baseFileName)
  24. if err != nil {
  25. t.Logf("WriteSortedEcxFile: %v", err)
  26. }
  27. err = validateFiles(baseFileName)
  28. if err != nil {
  29. t.Logf("WriteSortedEcxFile: %v", err)
  30. }
  31. removeGeneratedFiles(baseFileName)
  32. }
  33. func validateFiles(baseFileName string) error {
  34. cm, err := readCompactMap(baseFileName)
  35. if err != nil {
  36. return fmt.Errorf("readCompactMap: %v", err)
  37. }
  38. datFile, err := os.OpenFile(baseFileName+".dat", os.O_RDONLY, 0)
  39. if err != nil {
  40. return fmt.Errorf("failed to open dat file: %v", err)
  41. }
  42. defer datFile.Close()
  43. fi, err := datFile.Stat()
  44. if err != nil {
  45. return fmt.Errorf("failed to stat dat file: %v", err)
  46. }
  47. ecFiles, err := openEcFiles(baseFileName, true)
  48. defer closeEcFiles(ecFiles)
  49. err = cm.AscendingVisit(func(value needle_map.NeedleValue) error {
  50. return assertSame(datFile, fi.Size(), ecFiles, value.Offset, value.Size)
  51. })
  52. if err != nil {
  53. return fmt.Errorf("failed to check ec files: %v", err)
  54. }
  55. return nil
  56. }
  57. func assertSame(datFile *os.File, datSize int64, ecFiles []*os.File, offset types.Offset, size uint32) error {
  58. data, err := readDatFile(datFile, offset, size)
  59. if err != nil {
  60. return fmt.Errorf("failed to read dat file: %v", err)
  61. }
  62. ecData, err := readEcFile(datSize, ecFiles, offset, size)
  63. if err != nil {
  64. return fmt.Errorf("failed to read ec file: %v", err)
  65. }
  66. if bytes.Compare(data, ecData) != 0 {
  67. return fmt.Errorf("unexpected data read")
  68. }
  69. return nil
  70. }
  71. func readDatFile(datFile *os.File, offset types.Offset, size uint32) ([]byte, error) {
  72. data := make([]byte, size)
  73. n, err := datFile.ReadAt(data, offset.ToAcutalOffset())
  74. if err != nil {
  75. return nil, fmt.Errorf("failed to ReadAt dat file: %v", err)
  76. }
  77. if n != int(size) {
  78. return nil, fmt.Errorf("unexpected read size %d, expected %d", n, size)
  79. }
  80. return data, nil
  81. }
  82. func readEcFile(datSize int64, ecFiles []*os.File, offset types.Offset, size uint32) (data []byte, err error) {
  83. intervals := locateData(largeBlockSize, smallBlockSize, datSize, offset.ToAcutalOffset(), size)
  84. nLargeBlockRows := int(datSize / (largeBlockSize * DataShardsCount))
  85. for i, interval := range intervals {
  86. if d, e := readOneInterval(interval, ecFiles, nLargeBlockRows); e != nil {
  87. return nil, e
  88. } else {
  89. if i == 0 {
  90. data = d
  91. } else {
  92. data = append(data, d...)
  93. }
  94. }
  95. }
  96. return data, nil
  97. }
  98. func readOneInterval(interval Interval, ecFiles []*os.File, nLargeBlockRows int) (data []byte, err error) {
  99. ecFileOffset := interval.innerBlockOffset
  100. rowIndex := interval.blockIndex / DataShardsCount
  101. if interval.isLargeBlock {
  102. ecFileOffset += int64(rowIndex) * largeBlockSize
  103. } else {
  104. ecFileOffset += int64(nLargeBlockRows)*largeBlockSize + int64(rowIndex)*smallBlockSize
  105. }
  106. ecFileIndex := interval.blockIndex % DataShardsCount
  107. data = make([]byte, interval.size)
  108. err = readFromFile(ecFiles[ecFileIndex], data, ecFileOffset)
  109. { // do some ec testing
  110. ecData, err := readFromOtherEcFiles(ecFiles, ecFileIndex, ecFileOffset, interval.size)
  111. if err != nil {
  112. return nil, fmt.Errorf("ec reconstruct error: %v", err)
  113. }
  114. if bytes.Compare(data, ecData) != 0 {
  115. return nil, fmt.Errorf("ec compare error")
  116. }
  117. }
  118. return
  119. }
  120. func readFromOtherEcFiles(ecFiles []*os.File, ecFileIndex int, ecFileOffset int64, size uint32) (data []byte, err error) {
  121. enc, err := reedsolomon.New(DataShardsCount, ParityShardsCount)
  122. if err != nil {
  123. return nil, fmt.Errorf("failed to create encoder: %v", err)
  124. }
  125. bufs := make([][]byte, TotalShardsCount)
  126. for i := 0; i < DataShardsCount; {
  127. n := int(rand.Int31n(TotalShardsCount))
  128. if n == ecFileIndex || bufs[n] != nil {
  129. continue
  130. }
  131. bufs[n] = make([]byte, size)
  132. i++
  133. }
  134. for i, buf := range bufs {
  135. if buf == nil {
  136. continue
  137. }
  138. err = readFromFile(ecFiles[i], buf, ecFileOffset)
  139. if err != nil {
  140. return
  141. }
  142. }
  143. if err = enc.ReconstructData(bufs); err != nil {
  144. return nil, err
  145. }
  146. return bufs[ecFileIndex], nil
  147. }
  148. func readFromFile(file *os.File, data []byte, ecFileOffset int64) (err error) {
  149. _, err = file.ReadAt(data, ecFileOffset)
  150. return
  151. }
  152. func removeGeneratedFiles(baseFileName string) {
  153. for i := 0; i < DataShardsCount+ParityShardsCount; i++ {
  154. fname := fmt.Sprintf("%s.ec%02d", baseFileName, i+1)
  155. os.Remove(fname)
  156. }
  157. os.Remove(baseFileName + ".ecx")
  158. }
  159. func TestLocateData(t *testing.T) {
  160. intervals := locateData(largeBlockSize, smallBlockSize, DataShardsCount*largeBlockSize+1, DataShardsCount*largeBlockSize, 1)
  161. if len(intervals) != 1 {
  162. t.Errorf("unexpected interval size %d", len(intervals))
  163. }
  164. if !intervals[0].sameAs(Interval{0, 0, 1, false}) {
  165. t.Errorf("unexpected interval %+v", intervals[0])
  166. }
  167. intervals = locateData(largeBlockSize, smallBlockSize, DataShardsCount*largeBlockSize+1, DataShardsCount*largeBlockSize/2+100, DataShardsCount*largeBlockSize+1-DataShardsCount*largeBlockSize/2-100)
  168. fmt.Printf("%+v\n", intervals)
  169. }
  170. func (this Interval) sameAs(that Interval) bool {
  171. return this.isLargeBlock == that.isLargeBlock &&
  172. this.innerBlockOffset == that.innerBlockOffset &&
  173. this.blockIndex == that.blockIndex &&
  174. this.size == that.size
  175. }