You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

301 lines
7.7 KiB

5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
3 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
  1. package log_buffer
  2. import (
  3. "bytes"
  4. "sync"
  5. "time"
  6. "github.com/golang/protobuf/proto"
  7. "github.com/chrislusf/seaweedfs/weed/glog"
  8. "github.com/chrislusf/seaweedfs/weed/pb/filer_pb"
  9. "github.com/chrislusf/seaweedfs/weed/util"
  10. )
  11. const BufferSize = 4 * 1024 * 1024
  12. const PreviousBufferCount = 3
  13. type dataToFlush struct {
  14. startTime time.Time
  15. stopTime time.Time
  16. data *bytes.Buffer
  17. }
  18. type LogBuffer struct {
  19. name string
  20. prevBuffers *SealedBuffers
  21. buf []byte
  22. idx []int
  23. pos int
  24. startTime time.Time
  25. stopTime time.Time
  26. lastFlushTime time.Time
  27. sizeBuf []byte
  28. flushInterval time.Duration
  29. flushFn func(startTime, stopTime time.Time, buf []byte)
  30. notifyFn func()
  31. isStopping bool
  32. flushChan chan *dataToFlush
  33. lastTsNs int64
  34. sync.RWMutex
  35. }
  36. func NewLogBuffer(name string, flushInterval time.Duration, flushFn func(startTime, stopTime time.Time, buf []byte), notifyFn func()) *LogBuffer {
  37. lb := &LogBuffer{
  38. name: name,
  39. prevBuffers: newSealedBuffers(PreviousBufferCount),
  40. buf: make([]byte, BufferSize),
  41. sizeBuf: make([]byte, 4),
  42. flushInterval: flushInterval,
  43. flushFn: flushFn,
  44. notifyFn: notifyFn,
  45. flushChan: make(chan *dataToFlush, 256),
  46. }
  47. go lb.loopFlush()
  48. go lb.loopInterval()
  49. return lb
  50. }
  51. func (m *LogBuffer) AddToBuffer(partitionKey, data []byte, processingTsNs int64) {
  52. m.Lock()
  53. defer func() {
  54. m.Unlock()
  55. if m.notifyFn != nil {
  56. m.notifyFn()
  57. }
  58. }()
  59. // need to put the timestamp inside the lock
  60. var ts time.Time
  61. if processingTsNs == 0 {
  62. ts = time.Now()
  63. processingTsNs = ts.UnixNano()
  64. } else {
  65. ts = time.Unix(0, processingTsNs)
  66. }
  67. if m.lastTsNs >= processingTsNs {
  68. // this is unlikely to happen, but just in case
  69. processingTsNs = m.lastTsNs + 1
  70. ts = time.Unix(0, processingTsNs)
  71. }
  72. m.lastTsNs = processingTsNs
  73. logEntry := &filer_pb.LogEntry{
  74. TsNs: processingTsNs,
  75. PartitionKeyHash: util.HashToInt32(partitionKey),
  76. Data: data,
  77. }
  78. logEntryData, _ := proto.Marshal(logEntry)
  79. size := len(logEntryData)
  80. if m.pos == 0 {
  81. m.startTime = ts
  82. }
  83. if m.startTime.Add(m.flushInterval).Before(ts) || len(m.buf)-m.pos < size+4 {
  84. // glog.V(4).Infof("%s copyToFlush1 start time %v, ts %v, remaining %d bytes", m.name, m.startTime, ts, len(m.buf)-m.pos)
  85. m.flushChan <- m.copyToFlush()
  86. m.startTime = ts
  87. if len(m.buf) < size+4 {
  88. m.buf = make([]byte, 2*size+4)
  89. }
  90. }
  91. m.stopTime = ts
  92. m.idx = append(m.idx, m.pos)
  93. util.Uint32toBytes(m.sizeBuf, uint32(size))
  94. copy(m.buf[m.pos:m.pos+4], m.sizeBuf)
  95. copy(m.buf[m.pos+4:m.pos+4+size], logEntryData)
  96. m.pos += size + 4
  97. // fmt.Printf("entry size %d total %d count %d, buffer:%p\n", size, m.pos, len(m.idx), m)
  98. }
  99. func (m *LogBuffer) Shutdown() {
  100. m.Lock()
  101. defer m.Unlock()
  102. if m.isStopping {
  103. return
  104. }
  105. m.isStopping = true
  106. toFlush := m.copyToFlush()
  107. m.flushChan <- toFlush
  108. close(m.flushChan)
  109. }
  110. func (m *LogBuffer) loopFlush() {
  111. for d := range m.flushChan {
  112. if d != nil {
  113. // glog.V(4).Infof("%s flush [%v, %v] size %d", m.name, d.startTime, d.stopTime, len(d.data.Bytes()))
  114. m.flushFn(d.startTime, d.stopTime, d.data.Bytes())
  115. d.releaseMemory()
  116. // local logbuffer is different from aggregate logbuffer here
  117. m.lastFlushTime = d.stopTime
  118. }
  119. }
  120. }
  121. func (m *LogBuffer) loopInterval() {
  122. for !m.isStopping {
  123. time.Sleep(m.flushInterval)
  124. m.Lock()
  125. if m.isStopping {
  126. m.Unlock()
  127. return
  128. }
  129. toFlush := m.copyToFlush()
  130. m.flushChan <- toFlush
  131. m.Unlock()
  132. }
  133. }
  134. func (m *LogBuffer) copyToFlush() *dataToFlush {
  135. if m.pos > 0 {
  136. // fmt.Printf("flush buffer %d pos %d empty space %d\n", len(m.buf), m.pos, len(m.buf)-m.pos)
  137. var d *dataToFlush
  138. if m.flushFn != nil {
  139. d = &dataToFlush{
  140. startTime: m.startTime,
  141. stopTime: m.stopTime,
  142. data: copiedBytes(m.buf[:m.pos]),
  143. }
  144. // glog.V(4).Infof("%s flushing [0,%d) with %d entries [%v, %v]", m.name, m.pos, len(m.idx), m.startTime, m.stopTime)
  145. } else {
  146. // glog.V(4).Infof("%s removed from memory [0,%d) with %d entries [%v, %v]", m.name, m.pos, len(m.idx), m.startTime, m.stopTime)
  147. m.lastFlushTime = m.stopTime
  148. }
  149. m.buf = m.prevBuffers.SealBuffer(m.startTime, m.stopTime, m.buf, m.pos)
  150. m.startTime = time.Unix(0, 0)
  151. m.stopTime = time.Unix(0, 0)
  152. m.pos = 0
  153. m.idx = m.idx[:0]
  154. return d
  155. }
  156. return nil
  157. }
  158. func (d *dataToFlush) releaseMemory() {
  159. d.data.Reset()
  160. bufferPool.Put(d.data)
  161. }
  162. func (m *LogBuffer) ReadFromBuffer(lastReadTime time.Time) (bufferCopy *bytes.Buffer, err error) {
  163. m.RLock()
  164. defer m.RUnlock()
  165. if !m.lastFlushTime.IsZero() && m.lastFlushTime.After(lastReadTime) {
  166. if time.Now().Sub(m.lastFlushTime) < m.flushInterval*2 {
  167. diff := m.lastFlushTime.Sub(lastReadTime)
  168. glog.V(4).Infof("lastFlush:%v lastRead:%v diff:%v", m.lastFlushTime, lastReadTime, diff)
  169. return nil, ResumeFromDiskError
  170. }
  171. }
  172. /*
  173. fmt.Printf("read buffer %p: %v last stop time: [%v,%v], pos %d, entries:%d, prevBufs:%d\n", m, lastReadTime, m.startTime, m.stopTime, m.pos, len(m.idx), len(m.prevBuffers.buffers))
  174. for i, prevBuf := range m.prevBuffers.buffers {
  175. fmt.Printf(" prev %d : %s\n", i, prevBuf.String())
  176. }
  177. */
  178. if lastReadTime.Equal(m.stopTime) {
  179. return nil, nil
  180. }
  181. if lastReadTime.After(m.stopTime) {
  182. // glog.Fatalf("unexpected last read time %v, older than latest %v", lastReadTime, m.stopTime)
  183. return nil, nil
  184. }
  185. if lastReadTime.Before(m.startTime) {
  186. // println("checking ", lastReadTime.UnixNano())
  187. for _, buf := range m.prevBuffers.buffers {
  188. if buf.startTime.After(lastReadTime) {
  189. // glog.V(4).Infof("%s return the %d sealed buffer %v", m.name, i, buf.startTime)
  190. // println("return the", i, "th in memory", buf.startTime.UnixNano())
  191. return copiedBytes(buf.buf[:buf.size]), nil
  192. }
  193. if !buf.startTime.After(lastReadTime) && buf.stopTime.After(lastReadTime) {
  194. pos := buf.locateByTs(lastReadTime)
  195. // fmt.Printf("locate buffer[%d] pos %d\n", i, pos)
  196. return copiedBytes(buf.buf[pos:buf.size]), nil
  197. }
  198. }
  199. // glog.V(4).Infof("%s return the current buf %v", m.name, lastReadTime)
  200. return copiedBytes(m.buf[:m.pos]), nil
  201. }
  202. lastTs := lastReadTime.UnixNano()
  203. l, h := 0, len(m.idx)-1
  204. /*
  205. for i, pos := range m.idx {
  206. logEntry, ts := readTs(m.buf, pos)
  207. event := &filer_pb.SubscribeMetadataResponse{}
  208. proto.Unmarshal(logEntry.Data, event)
  209. entry := event.EventNotification.OldEntry
  210. if entry == nil {
  211. entry = event.EventNotification.NewEntry
  212. }
  213. fmt.Printf("entry %d ts: %v offset:%d dir:%s name:%s\n", i, time.Unix(0, ts), pos, event.Directory, entry.Name)
  214. }
  215. fmt.Printf("l=%d, h=%d\n", l, h)
  216. */
  217. for l <= h {
  218. mid := (l + h) / 2
  219. pos := m.idx[mid]
  220. _, t := readTs(m.buf, pos)
  221. if t <= lastTs {
  222. l = mid + 1
  223. } else if lastTs < t {
  224. var prevT int64
  225. if mid > 0 {
  226. _, prevT = readTs(m.buf, m.idx[mid-1])
  227. }
  228. if prevT <= lastTs {
  229. // fmt.Printf("found l=%d, m-1=%d(ts=%d), m=%d(ts=%d), h=%d [%d, %d) \n", l, mid-1, prevT, mid, t, h, pos, m.pos)
  230. return copiedBytes(m.buf[pos:m.pos]), nil
  231. }
  232. h = mid
  233. }
  234. // fmt.Printf("l=%d, h=%d\n", l, h)
  235. }
  236. // FIXME: this could be that the buffer has been flushed already
  237. return nil, nil
  238. }
  239. func (m *LogBuffer) ReleaseMemory(b *bytes.Buffer) {
  240. bufferPool.Put(b)
  241. }
  242. var bufferPool = sync.Pool{
  243. New: func() interface{} {
  244. return new(bytes.Buffer)
  245. },
  246. }
  247. func copiedBytes(buf []byte) (copied *bytes.Buffer) {
  248. copied = bufferPool.Get().(*bytes.Buffer)
  249. copied.Reset()
  250. copied.Write(buf)
  251. return
  252. }
  253. func readTs(buf []byte, pos int) (size int, ts int64) {
  254. size = int(util.BytesToUint32(buf[pos : pos+4]))
  255. entryData := buf[pos+4 : pos+4+size]
  256. logEntry := &filer_pb.LogEntry{}
  257. err := proto.Unmarshal(entryData, logEntry)
  258. if err != nil {
  259. glog.Fatalf("unexpected unmarshal filer_pb.LogEntry: %v", err)
  260. }
  261. return size, logEntry.TsNs
  262. }