You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

385 lines
9.7 KiB

12 years ago
12 years ago
12 years ago
  1. package storage
  2. import (
  3. "bytes"
  4. "errors"
  5. "fmt"
  6. "io"
  7. "log"
  8. "os"
  9. "path"
  10. "sync"
  11. )
  12. const (
  13. SuperBlockSize = 8
  14. )
  15. type SuperBlock struct {
  16. Version Version
  17. ReplicaType ReplicationType
  18. }
  19. func (s *SuperBlock) Bytes() []byte {
  20. header := make([]byte, SuperBlockSize)
  21. header[0] = byte(s.Version)
  22. header[1] = s.ReplicaType.Byte()
  23. return header
  24. }
  25. type Volume struct {
  26. Id VolumeId
  27. dir string
  28. dataFile *os.File
  29. nm NeedleMapper
  30. readOnly bool
  31. SuperBlock
  32. accessLock sync.Mutex
  33. }
  34. func NewVolume(dirname string, id VolumeId, replicationType ReplicationType) (v *Volume, e error) {
  35. v = &Volume{dir: dirname, Id: id}
  36. v.SuperBlock = SuperBlock{ReplicaType: replicationType}
  37. e = v.load(true)
  38. return
  39. }
  40. func LoadVolumeOnly(dirname string, id VolumeId) (v *Volume, e error) {
  41. v = &Volume{dir: dirname, Id: id}
  42. v.SuperBlock = SuperBlock{ReplicaType: CopyNil}
  43. e = v.load(false)
  44. return
  45. }
  46. func (v *Volume) load(alsoLoadIndex bool) error {
  47. var e error
  48. fileName := path.Join(v.dir, v.Id.String())
  49. v.dataFile, e = os.OpenFile(fileName+".dat", os.O_RDWR|os.O_CREATE, 0644)
  50. if e != nil {
  51. if !os.IsPermission(e) {
  52. return fmt.Errorf("cannot create Volume Data %s.dat: %s", fileName, e)
  53. }
  54. if v.dataFile, e = os.Open(fileName + ".dat"); e != nil {
  55. return fmt.Errorf("cannot open Volume Data %s.dat: %s", fileName, e)
  56. }
  57. log.Printf("opening " + fileName + ".dat in READONLY mode")
  58. v.readOnly = true
  59. }
  60. if v.ReplicaType == CopyNil {
  61. e = v.readSuperBlock()
  62. } else {
  63. e = v.maybeWriteSuperBlock()
  64. }
  65. if e == nil && alsoLoadIndex {
  66. var indexFile *os.File
  67. if v.readOnly {
  68. if indexFile, e = os.Open(fileName + ".idx"); e != nil && !os.IsNotExist(e) {
  69. return fmt.Errorf("cannot open index file %s.idx: %s", fileName, e)
  70. }
  71. if indexFile != nil {
  72. log.Printf("converting %s.idx to %s.cdb", fileName, fileName)
  73. if e = ConvertIndexToCdb(fileName+".cdb", indexFile); e != nil {
  74. log.Printf("error converting %s.idx to %s.cdb: %s", fileName, fileName)
  75. } else {
  76. indexFile.Close()
  77. os.Remove(indexFile.Name())
  78. indexFile = nil
  79. }
  80. }
  81. v.nm, e = OpenCdbMap(fileName + ".cdb")
  82. return e
  83. } else {
  84. indexFile, e = os.OpenFile(fileName+".idx", os.O_RDWR|os.O_CREATE, 0644)
  85. if e != nil {
  86. return fmt.Errorf("cannot create Volume Data %s.dat: %s", fileName, e)
  87. }
  88. }
  89. v.nm, e = LoadNeedleMap(indexFile)
  90. }
  91. return e
  92. }
  93. func (v *Volume) Version() Version {
  94. return v.SuperBlock.Version
  95. }
  96. func (v *Volume) Size() int64 {
  97. v.accessLock.Lock()
  98. defer v.accessLock.Unlock()
  99. stat, e := v.dataFile.Stat()
  100. if e == nil {
  101. return stat.Size()
  102. }
  103. log.Printf("Failed to read file size %s %s\n", v.dataFile.Name(), e.Error())
  104. return -1
  105. }
  106. func (v *Volume) Close() {
  107. v.accessLock.Lock()
  108. defer v.accessLock.Unlock()
  109. v.nm.Close()
  110. _ = v.dataFile.Close()
  111. }
  112. func (v *Volume) maybeWriteSuperBlock() error {
  113. stat, e := v.dataFile.Stat()
  114. if e != nil {
  115. log.Printf("failed to stat datafile %s: %s", v.dataFile, e)
  116. return e
  117. }
  118. if stat.Size() == 0 {
  119. v.SuperBlock.Version = CurrentVersion
  120. _, e = v.dataFile.Write(v.SuperBlock.Bytes())
  121. if e != nil && os.IsPermission(e) {
  122. //read-only, but zero length - recreate it!
  123. if v.dataFile, e = os.Create(v.dataFile.Name()); e == nil {
  124. if _, e = v.dataFile.Write(v.SuperBlock.Bytes()); e == nil {
  125. v.readOnly = false
  126. }
  127. }
  128. }
  129. }
  130. return e
  131. }
  132. func (v *Volume) readSuperBlock() (err error) {
  133. if _, err = v.dataFile.Seek(0, 0); err != nil {
  134. return fmt.Errorf("cannot seek to the beginning of %s: %s", v.dataFile, err)
  135. }
  136. header := make([]byte, SuperBlockSize)
  137. if _, e := v.dataFile.Read(header); e != nil {
  138. return fmt.Errorf("cannot read superblock: %s", e)
  139. }
  140. v.SuperBlock, err = ParseSuperBlock(header)
  141. return err
  142. }
  143. func ParseSuperBlock(header []byte) (superBlock SuperBlock, err error) {
  144. superBlock.Version = Version(header[0])
  145. if superBlock.ReplicaType, err = NewReplicationTypeFromByte(header[1]); err != nil {
  146. err = fmt.Errorf("cannot read replica type: %s", err)
  147. }
  148. return
  149. }
  150. func (v *Volume) NeedToReplicate() bool {
  151. return v.ReplicaType.GetCopyCount() > 1
  152. }
  153. func (v *Volume) isFileUnchanged(n *Needle) bool {
  154. nv, ok := v.nm.Get(n.Id)
  155. if ok && nv.Offset > 0 {
  156. if _, err := v.dataFile.Seek(int64(nv.Offset)*NeedlePaddingSize, 0); err != nil {
  157. return false
  158. }
  159. oldNeedle := new(Needle)
  160. oldNeedle.Read(v.dataFile, nv.Size, v.Version())
  161. if oldNeedle.Checksum == n.Checksum && bytes.Equal(oldNeedle.Data, n.Data) {
  162. n.Size = oldNeedle.Size
  163. return true
  164. }
  165. }
  166. return false
  167. }
  168. func (v *Volume) write(n *Needle) (size uint32, err error) {
  169. if v.readOnly {
  170. err = fmt.Errorf("%s is read-only", v.dataFile)
  171. return
  172. }
  173. v.accessLock.Lock()
  174. defer v.accessLock.Unlock()
  175. if v.isFileUnchanged(n) {
  176. size = n.Size
  177. return
  178. }
  179. var offset int64
  180. if offset, err = v.dataFile.Seek(0, 2); err != nil {
  181. return
  182. }
  183. //ensure file writing starting from aligned positions
  184. if offset%NeedlePaddingSize != 0 {
  185. offset = offset + (NeedlePaddingSize - offset%NeedlePaddingSize)
  186. if offset, err = v.dataFile.Seek(offset, 0); err != nil {
  187. return
  188. }
  189. }
  190. if size, err = n.Append(v.dataFile, v.Version()); err != nil {
  191. if e := v.dataFile.Truncate(offset); e != nil {
  192. err = fmt.Errorf("%s\ncannot truncate %s: %s", err, v.dataFile, e)
  193. }
  194. return
  195. }
  196. nv, ok := v.nm.Get(n.Id)
  197. if !ok || int64(nv.Offset)*NeedlePaddingSize < offset {
  198. _, err = v.nm.Put(n.Id, uint32(offset/NeedlePaddingSize), n.Size)
  199. }
  200. return
  201. }
  202. func (v *Volume) delete(n *Needle) (uint32, error) {
  203. if v.readOnly {
  204. return 0, fmt.Errorf("%s is read-only", v.dataFile)
  205. }
  206. v.accessLock.Lock()
  207. defer v.accessLock.Unlock()
  208. nv, ok := v.nm.Get(n.Id)
  209. //fmt.Println("key", n.Id, "volume offset", nv.Offset, "data_size", n.Size, "cached size", nv.Size)
  210. if ok {
  211. var err error
  212. size := nv.Size
  213. if err = v.nm.Delete(n.Id); err != nil {
  214. return size, err
  215. }
  216. if _, err = v.dataFile.Seek(0, 2); err != nil {
  217. return size, err
  218. }
  219. n.Data = make([]byte, 0)
  220. _, err = n.Append(v.dataFile, v.Version())
  221. return size, err
  222. }
  223. return 0, nil
  224. }
  225. func (v *Volume) read(n *Needle) (int, error) {
  226. v.accessLock.Lock()
  227. defer v.accessLock.Unlock()
  228. nv, ok := v.nm.Get(n.Id)
  229. if ok && nv.Offset > 0 {
  230. if _, err := v.dataFile.Seek(int64(nv.Offset)*NeedlePaddingSize, 0); err != nil {
  231. return -1, err
  232. }
  233. return n.Read(v.dataFile, nv.Size, v.Version())
  234. }
  235. return -1, errors.New("Not Found")
  236. }
  237. func (v *Volume) garbageLevel() float64 {
  238. return float64(v.nm.DeletedSize()) / float64(v.ContentSize())
  239. }
  240. func (v *Volume) compact() error {
  241. v.accessLock.Lock()
  242. defer v.accessLock.Unlock()
  243. filePath := path.Join(v.dir, v.Id.String())
  244. return v.copyDataAndGenerateIndexFile(filePath+".cpd", filePath+".cpx")
  245. }
  246. func (v *Volume) commitCompact() error {
  247. v.accessLock.Lock()
  248. defer v.accessLock.Unlock()
  249. _ = v.dataFile.Close()
  250. var e error
  251. if e = os.Rename(path.Join(v.dir, v.Id.String()+".cpd"), path.Join(v.dir, v.Id.String()+".dat")); e != nil {
  252. return e
  253. }
  254. if e = os.Rename(path.Join(v.dir, v.Id.String()+".cpx"), path.Join(v.dir, v.Id.String()+".idx")); e != nil {
  255. return e
  256. }
  257. if e = v.load(true); e != nil {
  258. return e
  259. }
  260. return nil
  261. }
  262. func (v *Volume) freeze() error {
  263. if v.readOnly {
  264. return nil
  265. }
  266. nm, ok := v.nm.(*NeedleMap)
  267. if !ok {
  268. return nil
  269. }
  270. v.accessLock.Lock()
  271. defer v.accessLock.Unlock()
  272. bn, _ := nakeFilename(v.dataFile.Name())
  273. cdbFn := bn + ".cdb"
  274. log.Printf("converting %s to %s", nm.indexFile.Name(), cdbFn)
  275. err := DumpNeedleMapToCdb(cdbFn, nm)
  276. if err != nil {
  277. return err
  278. }
  279. if v.nm, err = OpenCdbMap(cdbFn); err != nil {
  280. return err
  281. }
  282. nm.indexFile.Close()
  283. os.Remove(nm.indexFile.Name())
  284. v.readOnly = true
  285. return nil
  286. }
  287. func ScanVolumeFile(dirname string, id VolumeId,
  288. visitSuperBlock func(SuperBlock) error,
  289. visitNeedle func(n *Needle, offset uint32) error) (err error) {
  290. var v *Volume
  291. if v, err = LoadVolumeOnly(dirname, id); err != nil {
  292. return
  293. }
  294. if err = visitSuperBlock(v.SuperBlock); err != nil {
  295. return
  296. }
  297. version := v.Version()
  298. offset := uint32(SuperBlockSize)
  299. n, rest, e := ReadNeedleHeader(v.dataFile, version)
  300. if e != nil {
  301. err = fmt.Errorf("cannot read needle header: %s", e)
  302. return
  303. }
  304. for n != nil {
  305. if err = n.ReadNeedleBody(v.dataFile, version, rest); err != nil {
  306. err = fmt.Errorf("cannot read needle body: %s", err)
  307. return
  308. }
  309. if err = visitNeedle(n, offset); err != nil {
  310. return
  311. }
  312. offset += NeedleHeaderSize + rest
  313. if n, rest, err = ReadNeedleHeader(v.dataFile, version); err != nil {
  314. if err == io.EOF {
  315. return nil
  316. }
  317. return fmt.Errorf("cannot read needle header: %s", err)
  318. }
  319. }
  320. return
  321. }
  322. func (v *Volume) copyDataAndGenerateIndexFile(dstName, idxName string) (err error) {
  323. var (
  324. dst, idx *os.File
  325. )
  326. if dst, err = os.OpenFile(dstName, os.O_WRONLY|os.O_CREATE, 0644); err != nil {
  327. return
  328. }
  329. defer dst.Close()
  330. if idx, err = os.OpenFile(idxName, os.O_WRONLY|os.O_CREATE, 0644); err != nil {
  331. return
  332. }
  333. defer idx.Close()
  334. nm := NewNeedleMap(idx)
  335. new_offset := uint32(SuperBlockSize)
  336. err = ScanVolumeFile(v.dir, v.Id, func(superBlock SuperBlock) error {
  337. _, err = dst.Write(superBlock.Bytes())
  338. return err
  339. }, func(n *Needle, offset uint32) error {
  340. nv, ok := v.nm.Get(n.Id)
  341. //log.Println("file size is", n.Size, "rest", rest)
  342. if ok && nv.Offset*NeedlePaddingSize == offset {
  343. if nv.Size > 0 {
  344. if _, err = nm.Put(n.Id, new_offset/NeedlePaddingSize, n.Size); err != nil {
  345. return fmt.Errorf("cannot put needle: %s", err)
  346. }
  347. if _, err = n.Append(dst, v.Version()); err != nil {
  348. return fmt.Errorf("cannot append needle: %s", err)
  349. }
  350. new_offset += n.DiskSize()
  351. //log.Println("saving key", n.Id, "volume offset", old_offset, "=>", new_offset, "data_size", n.Size, "rest", rest)
  352. }
  353. }
  354. return nil
  355. })
  356. return
  357. }
  358. func (v *Volume) ContentSize() uint64 {
  359. return v.nm.ContentSize()
  360. }