You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

146 lines
3.5 KiB

7 years ago
5 years ago
  1. package filesys
  2. import (
  3. "bytes"
  4. "io"
  5. "runtime"
  6. "sync"
  7. "time"
  8. "github.com/chrislusf/seaweedfs/weed/glog"
  9. "github.com/chrislusf/seaweedfs/weed/pb/filer_pb"
  10. )
  11. type ContinuousDirtyPages struct {
  12. intervals *ContinuousIntervals
  13. f *File
  14. writeWaitGroup sync.WaitGroup
  15. chunkSaveErrChan chan error
  16. chunkSaveErrChanClosed bool
  17. lastErr error
  18. lock sync.Mutex
  19. collection string
  20. replication string
  21. }
  22. func newDirtyPages(file *File) *ContinuousDirtyPages {
  23. dirtyPages := &ContinuousDirtyPages{
  24. intervals: &ContinuousIntervals{},
  25. f: file,
  26. chunkSaveErrChan: make(chan error, runtime.NumCPU()),
  27. }
  28. go func() {
  29. for t := range dirtyPages.chunkSaveErrChan {
  30. if t != nil {
  31. dirtyPages.lastErr = t
  32. }
  33. }
  34. }()
  35. return dirtyPages
  36. }
  37. func (pages *ContinuousDirtyPages) AddPage(offset int64, data []byte) {
  38. glog.V(4).Infof("%s AddPage [%d,%d) of %d bytes", pages.f.fullpath(), offset, offset+int64(len(data)), pages.f.entry.Attributes.FileSize)
  39. if len(data) > int(pages.f.wfs.option.ChunkSizeLimit) {
  40. // this is more than what buffer can hold.
  41. pages.flushAndSave(offset, data)
  42. }
  43. pages.intervals.AddInterval(data, offset)
  44. if pages.intervals.TotalSize() >= pages.f.wfs.option.ChunkSizeLimit {
  45. pages.saveExistingLargestPageToStorage()
  46. }
  47. return
  48. }
  49. func (pages *ContinuousDirtyPages) flushAndSave(offset int64, data []byte) {
  50. // flush existing
  51. pages.saveExistingPagesToStorage()
  52. // flush the new page
  53. pages.saveToStorage(bytes.NewReader(data), offset, int64(len(data)))
  54. return
  55. }
  56. func (pages *ContinuousDirtyPages) saveExistingPagesToStorage() {
  57. for pages.saveExistingLargestPageToStorage() {
  58. }
  59. }
  60. func (pages *ContinuousDirtyPages) saveExistingLargestPageToStorage() (hasSavedData bool) {
  61. maxList := pages.intervals.RemoveLargestIntervalLinkedList()
  62. if maxList == nil {
  63. return false
  64. }
  65. fileSize := int64(pages.f.entry.Attributes.FileSize)
  66. chunkSize := min(maxList.Size(), fileSize-maxList.Offset())
  67. if chunkSize == 0 {
  68. return false
  69. }
  70. pages.saveToStorage(maxList.ToReader(), maxList.Offset(), chunkSize)
  71. return true
  72. }
  73. func (pages *ContinuousDirtyPages) saveToStorage(reader io.Reader, offset int64, size int64) {
  74. errChanSize := pages.f.wfs.option.ConcurrentWriters
  75. if errChanSize == 0 {
  76. errChanSize = runtime.NumCPU()
  77. }
  78. if pages.chunkSaveErrChanClosed {
  79. pages.chunkSaveErrChan = make(chan error, errChanSize)
  80. pages.chunkSaveErrChanClosed = false
  81. }
  82. mtime := time.Now().UnixNano()
  83. pages.writeWaitGroup.Add(1)
  84. writer := func() {
  85. defer pages.writeWaitGroup.Done()
  86. reader = io.LimitReader(reader, size)
  87. chunk, collection, replication, err := pages.f.wfs.saveDataAsChunk(pages.f.fullpath())(reader, pages.f.Name, offset)
  88. if err != nil {
  89. glog.V(0).Infof("%s saveToStorage [%d,%d): %v", pages.f.fullpath(), offset, offset+size, err)
  90. pages.chunkSaveErrChan <- err
  91. return
  92. }
  93. chunk.Mtime = mtime
  94. pages.collection, pages.replication = collection, replication
  95. pages.f.addChunks([]*filer_pb.FileChunk{chunk})
  96. glog.V(3).Infof("%s saveToStorage [%d,%d)", pages.f.fullpath(), offset, offset+size)
  97. }
  98. if pages.f.wfs.concurrentWriters != nil {
  99. pages.f.wfs.concurrentWriters.Execute(writer)
  100. } else {
  101. go writer()
  102. }
  103. }
  104. func max(x, y int64) int64 {
  105. if x > y {
  106. return x
  107. }
  108. return y
  109. }
  110. func min(x, y int64) int64 {
  111. if x < y {
  112. return x
  113. }
  114. return y
  115. }
  116. func (pages *ContinuousDirtyPages) ReadDirtyDataAt(data []byte, startOffset int64) (maxStop int64) {
  117. return pages.intervals.ReadDataAt(data, startOffset)
  118. }