You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

229 lines
7.1 KiB

4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
2 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
2 years ago
4 years ago
3 years ago
2 years ago
2 years ago
2 years ago
  1. package filer
  2. import (
  3. "context"
  4. "fmt"
  5. "io"
  6. "math/rand"
  7. "sync"
  8. "github.com/seaweedfs/seaweedfs/weed/glog"
  9. "github.com/seaweedfs/seaweedfs/weed/pb/filer_pb"
  10. "github.com/seaweedfs/seaweedfs/weed/util"
  11. "github.com/seaweedfs/seaweedfs/weed/util/chunk_cache"
  12. "github.com/seaweedfs/seaweedfs/weed/wdclient"
  13. )
// ChunkReadAt reads a file's content at arbitrary offsets from a list of
// chunk views. It is used as an io.ReaderAt and an io.Closer.
type ChunkReadAt struct {
	// masterClient is neither set nor read in the visible part of this file.
	masterClient *wdclient.MasterClient
	// chunkViews are the chunk views walked, in slice order, by doReadAt.
	// NOTE(review): presumably sorted by LogicOffset - confirm against callers.
	chunkViews []*ChunkView
	// readerLock serializes ReadAt and ReadAtWithTime calls.
	readerLock sync.Mutex
	// fileSize is the logical file size in bytes; it bounds the trailing
	// zero-fill and decides when io.EOF is reported.
	fileSize int64
	// readerCache is the cache chunk data is read through; Close destroys it.
	readerCache *ReaderCache
	// readerPattern is told about every read and reports whether reads are
	// currently in random mode.
	readerPattern *ReaderPattern
	// lastChunkFid is the file id of the chunk most recently read through the
	// non-random path; empty until the first such read.
	lastChunkFid string
}
  23. var _ = io.ReaderAt(&ChunkReadAt{})
  24. var _ = io.Closer(&ChunkReadAt{})
  25. func LookupFn(filerClient filer_pb.FilerClient) wdclient.LookupFileIdFunctionType {
  26. vidCache := make(map[string]*filer_pb.Locations)
  27. var vicCacheLock sync.RWMutex
  28. return func(fileId string) (targetUrls []string, err error) {
  29. vid := VolumeId(fileId)
  30. vicCacheLock.RLock()
  31. locations, found := vidCache[vid]
  32. vicCacheLock.RUnlock()
  33. if !found {
  34. util.Retry("lookup volume "+vid, func() error {
  35. err = filerClient.WithFilerClient(false, func(client filer_pb.SeaweedFilerClient) error {
  36. resp, err := client.LookupVolume(context.Background(), &filer_pb.LookupVolumeRequest{
  37. VolumeIds: []string{vid},
  38. })
  39. if err != nil {
  40. return err
  41. }
  42. locations = resp.LocationsMap[vid]
  43. if locations == nil || len(locations.Locations) == 0 {
  44. glog.V(0).Infof("failed to locate %s", fileId)
  45. return fmt.Errorf("failed to locate %s", fileId)
  46. }
  47. vicCacheLock.Lock()
  48. vidCache[vid] = locations
  49. vicCacheLock.Unlock()
  50. return nil
  51. })
  52. return err
  53. })
  54. }
  55. if err != nil {
  56. return nil, err
  57. }
  58. fcDataCenter := filerClient.GetDataCenter()
  59. var sameDcTargetUrls, otherTargetUrls []string
  60. for _, loc := range locations.Locations {
  61. volumeServerAddress := filerClient.AdjustedUrl(loc)
  62. targetUrl := fmt.Sprintf("http://%s/%s", volumeServerAddress, fileId)
  63. if fcDataCenter == "" || fcDataCenter != loc.DataCenter {
  64. otherTargetUrls = append(otherTargetUrls, targetUrl)
  65. } else {
  66. sameDcTargetUrls = append(sameDcTargetUrls, targetUrl)
  67. }
  68. }
  69. rand.Shuffle(len(sameDcTargetUrls), func(i, j int) {
  70. sameDcTargetUrls[i], sameDcTargetUrls[j] = sameDcTargetUrls[j], sameDcTargetUrls[i]
  71. })
  72. rand.Shuffle(len(otherTargetUrls), func(i, j int) {
  73. otherTargetUrls[i], otherTargetUrls[j] = otherTargetUrls[j], otherTargetUrls[i]
  74. })
  75. // Prefer same data center
  76. targetUrls = append(sameDcTargetUrls, otherTargetUrls...)
  77. return
  78. }
  79. }
  80. func NewChunkReaderAtFromClient(lookupFn wdclient.LookupFileIdFunctionType, chunkViews []*ChunkView, chunkCache chunk_cache.ChunkCache, fileSize int64) *ChunkReadAt {
  81. return &ChunkReadAt{
  82. chunkViews: chunkViews,
  83. fileSize: fileSize,
  84. readerCache: newReaderCache(32, chunkCache, lookupFn),
  85. readerPattern: NewReaderPattern(),
  86. }
  87. }
  88. func (c *ChunkReadAt) Close() error {
  89. c.readerCache.destroy()
  90. return nil
  91. }
  92. func (c *ChunkReadAt) ReadAt(p []byte, offset int64) (n int, err error) {
  93. c.readerPattern.MonitorReadAt(offset, len(p))
  94. c.readerLock.Lock()
  95. defer c.readerLock.Unlock()
  96. // glog.V(4).Infof("ReadAt [%d,%d) of total file size %d bytes %d chunk views", offset, offset+int64(len(p)), c.fileSize, len(c.chunkViews))
  97. n, _, err = c.doReadAt(p, offset)
  98. return
  99. }
  100. func (c *ChunkReadAt) ReadAtWithTime(p []byte, offset int64) (n int, ts int64, err error) {
  101. c.readerPattern.MonitorReadAt(offset, len(p))
  102. c.readerLock.Lock()
  103. defer c.readerLock.Unlock()
  104. // glog.V(4).Infof("ReadAt [%d,%d) of total file size %d bytes %d chunk views", offset, offset+int64(len(p)), c.fileSize, len(c.chunkViews))
  105. return c.doReadAt(p, offset)
  106. }
  107. func (c *ChunkReadAt) doReadAt(p []byte, offset int64) (n int, ts int64, err error) {
  108. startOffset, remaining := offset, int64(len(p))
  109. var nextChunks []*ChunkView
  110. for i, chunk := range c.chunkViews {
  111. if remaining <= 0 {
  112. break
  113. }
  114. if i+1 < len(c.chunkViews) {
  115. nextChunks = c.chunkViews[i+1:]
  116. }
  117. if startOffset < chunk.LogicOffset {
  118. gap := chunk.LogicOffset - startOffset
  119. glog.V(4).Infof("zero [%d,%d)", startOffset, chunk.LogicOffset)
  120. n += zero(p, startOffset-offset, gap)
  121. startOffset, remaining = chunk.LogicOffset, remaining-gap
  122. if remaining <= 0 {
  123. break
  124. }
  125. }
  126. // fmt.Printf(">>> doReadAt [%d,%d), chunk[%d,%d)\n", offset, offset+int64(len(p)), chunk.LogicOffset, chunk.LogicOffset+int64(chunk.Size))
  127. chunkStart, chunkStop := max(chunk.LogicOffset, startOffset), min(chunk.LogicOffset+int64(chunk.Size), startOffset+remaining)
  128. if chunkStart >= chunkStop {
  129. continue
  130. }
  131. // glog.V(4).Infof("read [%d,%d), %d/%d chunk %s [%d,%d)", chunkStart, chunkStop, i, len(c.chunkViews), chunk.FileId, chunk.LogicOffset-chunk.Offset, chunk.LogicOffset-chunk.Offset+int64(chunk.Size))
  132. bufferOffset := chunkStart - chunk.LogicOffset + chunk.Offset
  133. ts = chunk.ModifiedTsNs
  134. copied, err := c.readChunkSliceAt(p[startOffset-offset:chunkStop-chunkStart+startOffset-offset], chunk, nextChunks, uint64(bufferOffset))
  135. if err != nil {
  136. glog.Errorf("fetching chunk %+v: %v\n", chunk, err)
  137. return copied, ts, err
  138. }
  139. n += copied
  140. startOffset, remaining = startOffset+int64(copied), remaining-int64(copied)
  141. }
  142. // glog.V(4).Infof("doReadAt [%d,%d), n:%v, err:%v", offset, offset+int64(len(p)), n, err)
  143. // zero the remaining bytes if a gap exists at the end of the last chunk (or a fully sparse file)
  144. if err == nil && remaining > 0 {
  145. var delta int64
  146. if c.fileSize > startOffset {
  147. delta = min(remaining, c.fileSize-startOffset)
  148. startOffset -= offset
  149. } else {
  150. delta = remaining
  151. startOffset = max(startOffset-offset, startOffset-remaining-offset)
  152. }
  153. glog.V(4).Infof("zero2 [%d,%d) of file size %d bytes", startOffset, startOffset+delta, c.fileSize)
  154. n += zero(p, startOffset, delta)
  155. }
  156. if err == nil && offset+int64(len(p)) >= c.fileSize {
  157. err = io.EOF
  158. }
  159. // fmt.Printf("~~~ filled %d, err: %v\n\n", n, err)
  160. return
  161. }
  162. func (c *ChunkReadAt) readChunkSliceAt(buffer []byte, chunkView *ChunkView, nextChunkViews []*ChunkView, offset uint64) (n int, err error) {
  163. if c.readerPattern.IsRandomMode() {
  164. n, err := c.readerCache.chunkCache.ReadChunkAt(buffer, chunkView.FileId, offset)
  165. if n > 0 {
  166. return n, err
  167. }
  168. return fetchChunkRange(buffer, c.readerCache.lookupFileIdFn, chunkView.FileId, chunkView.CipherKey, chunkView.IsGzipped, int64(offset))
  169. }
  170. n, err = c.readerCache.ReadChunkAt(buffer, chunkView.FileId, chunkView.CipherKey, chunkView.IsGzipped, int64(offset), int(chunkView.ChunkSize), chunkView.LogicOffset == 0)
  171. if c.lastChunkFid != chunkView.FileId {
  172. if chunkView.Offset == 0 { // start of a new chunk
  173. if c.lastChunkFid != "" {
  174. c.readerCache.UnCache(c.lastChunkFid)
  175. c.readerCache.MaybeCache(nextChunkViews)
  176. } else {
  177. if len(nextChunkViews) >= 1 {
  178. c.readerCache.MaybeCache(nextChunkViews[:1]) // just read the next chunk if at the very beginning
  179. }
  180. }
  181. }
  182. }
  183. c.lastChunkFid = chunkView.FileId
  184. return
  185. }
  186. func zero(buffer []byte, start, length int64) int {
  187. end := min(start+length, int64(len(buffer)))
  188. start = max(start, 0)
  189. // zero the bytes
  190. for o := start; o < end; o++ {
  191. buffer[o] = 0
  192. }
  193. return int(end - start)
  194. }