You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

389 lines
9.8 KiB

12 years ago
12 years ago
12 years ago
12 years ago
  1. package storage
  2. import (
  3. "errors"
  4. "fmt"
  5. "io"
  6. "log"
  7. "os"
  8. "path"
  9. "sync"
  10. )
  11. const (
  12. SuperBlockSize = 8
  13. )
  14. type SuperBlock struct {
  15. Version Version
  16. ReplicaType ReplicationType
  17. }
  18. func (s *SuperBlock) Bytes() []byte {
  19. header := make([]byte, SuperBlockSize)
  20. header[0] = byte(s.Version)
  21. header[1] = s.ReplicaType.Byte()
  22. return header
  23. }
  24. type Volume struct {
  25. Id VolumeId
  26. dir string
  27. dataFile *os.File
  28. nm NeedleMapper
  29. readOnly bool
  30. SuperBlock
  31. accessLock sync.Mutex
  32. }
  33. func NewVolume(dirname string, id VolumeId, replicationType ReplicationType) (v *Volume, e error) {
  34. v = &Volume{dir: dirname, Id: id}
  35. v.SuperBlock = SuperBlock{ReplicaType: replicationType}
  36. e = v.load(true)
  37. return
  38. }
  39. func LoadVolumeOnly(dirname string, id VolumeId) (v *Volume, e error) {
  40. v = &Volume{dir: dirname, Id: id}
  41. v.SuperBlock = SuperBlock{ReplicaType: CopyNil}
  42. e = v.load(false)
  43. return
  44. }
  45. func (v *Volume) load(alsoLoadIndex bool) error {
  46. var e error
  47. fileName := path.Join(v.dir, v.Id.String())
  48. v.dataFile, e = os.OpenFile(fileName+".dat", os.O_RDWR|os.O_CREATE, 0644)
  49. if e != nil {
  50. if !os.IsPermission(e) {
  51. return fmt.Errorf("cannot create Volume Data %s.dat: %s", fileName, e)
  52. }
  53. if v.dataFile, e = os.Open(fileName + ".dat"); e != nil {
  54. return fmt.Errorf("cannot open Volume Data %s.dat: %s", fileName, e)
  55. }
  56. log.Printf("opening " + fileName + ".dat in READONLY mode")
  57. v.readOnly = true
  58. }
  59. if v.ReplicaType == CopyNil {
  60. e = v.readSuperBlock()
  61. } else {
  62. e = v.maybeWriteSuperBlock()
  63. }
  64. if e == nil && alsoLoadIndex {
  65. var indexFile *os.File
  66. if v.readOnly {
  67. if indexFile, e = os.Open(fileName + ".idx"); e != nil && !os.IsNotExist(e) {
  68. return fmt.Errorf("cannot open index file %s.idx: %s", fileName, e)
  69. }
  70. if indexFile != nil {
  71. log.Printf("converting %s.idx to %s.cdb", fileName, fileName)
  72. if e = ConvertIndexToCdb(fileName+".cdb", indexFile); e != nil {
  73. log.Printf("error converting %s.idx to %s.cdb: %s", fileName, fileName)
  74. } else {
  75. indexFile.Close()
  76. os.Remove(indexFile.Name())
  77. indexFile = nil
  78. }
  79. }
  80. v.nm, e = OpenCdbMap(fileName + ".cdb")
  81. return e
  82. } else {
  83. indexFile, e = os.OpenFile(fileName+".idx", os.O_RDWR|os.O_CREATE, 0644)
  84. if e != nil {
  85. return fmt.Errorf("cannot create Volume Data %s.dat: %s", fileName, e)
  86. }
  87. }
  88. v.nm, e = LoadNeedleMap(indexFile)
  89. }
  90. return e
  91. }
  92. func (v *Volume) Version() Version {
  93. return v.SuperBlock.Version
  94. }
  95. func (v *Volume) Size() int64 {
  96. v.accessLock.Lock()
  97. defer v.accessLock.Unlock()
  98. stat, e := v.dataFile.Stat()
  99. if e == nil {
  100. return stat.Size()
  101. }
  102. fmt.Printf("Failed to read file size %s %s\n", v.dataFile.Name(), e.Error())
  103. return -1
  104. }
  105. func (v *Volume) Close() {
  106. v.accessLock.Lock()
  107. defer v.accessLock.Unlock()
  108. v.nm.Close()
  109. _ = v.dataFile.Close()
  110. }
  111. func (v *Volume) maybeWriteSuperBlock() error {
  112. stat, e := v.dataFile.Stat()
  113. if e != nil {
  114. fmt.Printf("failed to stat datafile %s: %s", v.dataFile, e)
  115. return e
  116. }
  117. if stat.Size() == 0 {
  118. v.SuperBlock.Version = CurrentVersion
  119. _, e = v.dataFile.Write(v.SuperBlock.Bytes())
  120. if e != nil && os.IsPermission(e) {
  121. //read-only, but zero length - recreate it!
  122. if v.dataFile, e = os.Create(v.dataFile.Name()); e == nil {
  123. if _, e = v.dataFile.Write(v.SuperBlock.Bytes()); e == nil {
  124. v.readOnly = false
  125. }
  126. }
  127. }
  128. }
  129. return e
  130. }
  131. func (v *Volume) readSuperBlock() (err error) {
  132. if _, err = v.dataFile.Seek(0, 0); err != nil {
  133. return fmt.Errorf("cannot seek to the beginning of %s: %s", v.dataFile, err)
  134. }
  135. header := make([]byte, SuperBlockSize)
  136. if _, e := v.dataFile.Read(header); e != nil {
  137. return fmt.Errorf("cannot read superblock: %s", e)
  138. }
  139. v.SuperBlock, err = ParseSuperBlock(header)
  140. return err
  141. }
  142. func ParseSuperBlock(header []byte) (superBlock SuperBlock, err error) {
  143. superBlock.Version = Version(header[0])
  144. if superBlock.ReplicaType, err = NewReplicationTypeFromByte(header[1]); err != nil {
  145. err = fmt.Errorf("cannot read replica type: %s", err)
  146. }
  147. return
  148. }
  149. func (v *Volume) NeedToReplicate() bool {
  150. return v.ReplicaType.GetCopyCount() > 1
  151. }
  152. func (v *Volume) isFileUnchanged(n *Needle) bool {
  153. nv, ok := v.nm.Get(n.Id)
  154. if ok && nv.Offset > 0 {
  155. if _, err := v.dataFile.Seek(int64(nv.Offset)*NeedlePaddingSize, 0); err != nil {
  156. return false
  157. }
  158. oldNeedle := new(Needle)
  159. oldNeedle.Read(v.dataFile, nv.Size, v.Version())
  160. if len(oldNeedle.Data) == len(n.Data) && oldNeedle.Checksum == n.Checksum {
  161. length := len(n.Data)
  162. for i := 0; i < length; i++ {
  163. if n.Data[i] != oldNeedle.Data[i] {
  164. return false
  165. }
  166. }
  167. n.Size = oldNeedle.Size
  168. return true
  169. }
  170. }
  171. return false
  172. }
  173. func (v *Volume) write(n *Needle) (size uint32, err error) {
  174. if v.readOnly {
  175. err = fmt.Errorf("%s is read-only", v.dataFile)
  176. return
  177. }
  178. v.accessLock.Lock()
  179. defer v.accessLock.Unlock()
  180. if v.isFileUnchanged(n) {
  181. size = n.Size
  182. return
  183. }
  184. var offset int64
  185. if offset, err = v.dataFile.Seek(0, 2); err != nil {
  186. return
  187. }
  188. //ensure file writing starting from aligned positions
  189. if offset%NeedlePaddingSize != 0 {
  190. offset = offset + (NeedlePaddingSize - offset%NeedlePaddingSize)
  191. if offset, err = v.dataFile.Seek(offset, 0); err != nil {
  192. return
  193. }
  194. }
  195. if size, err = n.Append(v.dataFile, v.Version()); err != nil {
  196. if e := v.dataFile.Truncate(offset); e != nil {
  197. err = fmt.Errorf("%s\ncannot truncate %s: %s", err, v.dataFile, e)
  198. }
  199. return
  200. }
  201. nv, ok := v.nm.Get(n.Id)
  202. if !ok || int64(nv.Offset)*NeedlePaddingSize < offset {
  203. _, err = v.nm.Put(n.Id, uint32(offset/NeedlePaddingSize), n.Size)
  204. }
  205. return
  206. }
  207. func (v *Volume) delete(n *Needle) (uint32, error) {
  208. if v.readOnly {
  209. return 0, fmt.Errorf("%s is read-only", v.dataFile)
  210. }
  211. v.accessLock.Lock()
  212. defer v.accessLock.Unlock()
  213. nv, ok := v.nm.Get(n.Id)
  214. //fmt.Println("key", n.Id, "volume offset", nv.Offset, "data_size", n.Size, "cached size", nv.Size)
  215. if ok {
  216. var err error
  217. if err = v.nm.Delete(n.Id); err != nil {
  218. return nv.Size, err
  219. }
  220. if _, err = v.dataFile.Seek(int64(nv.Offset*NeedlePaddingSize), 0); err != nil {
  221. return nv.Size, err
  222. }
  223. n.Data = make([]byte,0)
  224. _, err = n.Append(v.dataFile, v.Version())
  225. return nv.Size, err
  226. }
  227. return 0, nil
  228. }
  229. func (v *Volume) read(n *Needle) (int, error) {
  230. v.accessLock.Lock()
  231. defer v.accessLock.Unlock()
  232. nv, ok := v.nm.Get(n.Id)
  233. if ok && nv.Offset > 0 {
  234. if _, err := v.dataFile.Seek(int64(nv.Offset)*NeedlePaddingSize, 0); err != nil {
  235. return -1, err
  236. }
  237. return n.Read(v.dataFile, nv.Size, v.Version())
  238. }
  239. return -1, errors.New("Not Found")
  240. }
  241. func (v *Volume) garbageLevel() float64 {
  242. return float64(v.nm.DeletedSize()) / float64(v.ContentSize())
  243. }
  244. func (v *Volume) compact() error {
  245. v.accessLock.Lock()
  246. defer v.accessLock.Unlock()
  247. filePath := path.Join(v.dir, v.Id.String())
  248. return v.copyDataAndGenerateIndexFile(filePath+".cpd", filePath+".cpx")
  249. }
  250. func (v *Volume) commitCompact() error {
  251. v.accessLock.Lock()
  252. defer v.accessLock.Unlock()
  253. _ = v.dataFile.Close()
  254. var e error
  255. if e = os.Rename(path.Join(v.dir, v.Id.String()+".cpd"), path.Join(v.dir, v.Id.String()+".dat")); e != nil {
  256. return e
  257. }
  258. if e = os.Rename(path.Join(v.dir, v.Id.String()+".cpx"), path.Join(v.dir, v.Id.String()+".idx")); e != nil {
  259. return e
  260. }
  261. if e = v.load(true); e != nil {
  262. return e
  263. }
  264. return nil
  265. }
  266. func (v *Volume) freeze() error {
  267. if v.readOnly {
  268. return nil
  269. }
  270. nm, ok := v.nm.(*NeedleMap)
  271. if !ok {
  272. return nil
  273. }
  274. v.accessLock.Lock()
  275. defer v.accessLock.Unlock()
  276. bn, _ := nakeFilename(v.dataFile.Name())
  277. cdbFn := bn + ".cdb"
  278. log.Printf("converting %s to %s", nm.indexFile.Name(), cdbFn)
  279. err := DumpNeedleMapToCdb(cdbFn, nm)
  280. if err != nil {
  281. return err
  282. }
  283. if v.nm, err = OpenCdbMap(cdbFn); err != nil {
  284. return err
  285. }
  286. nm.indexFile.Close()
  287. os.Remove(nm.indexFile.Name())
  288. v.readOnly = true
  289. return nil
  290. }
  291. func ScanVolumeFile(dirname string, id VolumeId,
  292. visitSuperBlock func(SuperBlock) error,
  293. visitNeedle func(n *Needle, offset uint32) error) (err error) {
  294. var v *Volume
  295. if v, err = LoadVolumeOnly(dirname, id); err != nil {
  296. return
  297. }
  298. if err = visitSuperBlock(v.SuperBlock); err != nil {
  299. return
  300. }
  301. version := v.Version()
  302. offset := uint32(SuperBlockSize)
  303. n, rest, e := ReadNeedleHeader(v.dataFile, version)
  304. if e != nil {
  305. err = fmt.Errorf("cannot read needle header: %s", e)
  306. return
  307. }
  308. for n != nil {
  309. if err = n.ReadNeedleBody(v.dataFile, version, rest); err != nil {
  310. err = fmt.Errorf("cannot read needle body: %s", err)
  311. return
  312. }
  313. if err = visitNeedle(n, offset); err != nil {
  314. return
  315. }
  316. offset += NeedleHeaderSize + rest
  317. if n, rest, err = ReadNeedleHeader(v.dataFile, version); err != nil {
  318. if err == io.EOF {
  319. return nil
  320. }
  321. return fmt.Errorf("cannot read needle header: %s", err)
  322. }
  323. }
  324. return
  325. }
  326. func (v *Volume) copyDataAndGenerateIndexFile(dstName, idxName string) (err error) {
  327. var (
  328. dst, idx *os.File
  329. )
  330. if dst, err = os.OpenFile(dstName, os.O_WRONLY|os.O_CREATE, 0644); err != nil {
  331. return
  332. }
  333. defer dst.Close()
  334. if idx, err = os.OpenFile(idxName, os.O_WRONLY|os.O_CREATE, 0644); err != nil {
  335. return
  336. }
  337. defer idx.Close()
  338. nm := NewNeedleMap(idx)
  339. new_offset := uint32(SuperBlockSize)
  340. err = ScanVolumeFile(v.dir, v.Id, func(superBlock SuperBlock) error {
  341. _, err = dst.Write(superBlock.Bytes())
  342. return err
  343. }, func(n *Needle, offset uint32) error {
  344. nv, ok := v.nm.Get(n.Id)
  345. //log.Println("file size is", n.Size, "rest", rest)
  346. if ok && nv.Offset*NeedlePaddingSize == offset {
  347. if nv.Size > 0 {
  348. if _, err = nm.Put(n.Id, new_offset/NeedlePaddingSize, n.Size); err != nil {
  349. return fmt.Errorf("cannot put needle: %s", err)
  350. }
  351. if _, err = n.Append(dst, v.Version()); err != nil {
  352. return fmt.Errorf("cannot append needle: %s", err)
  353. }
  354. new_offset += n.DiskSize()
  355. //log.Println("saving key", n.Id, "volume offset", old_offset, "=>", new_offset, "data_size", n.Size, "rest", rest)
  356. }
  357. }
  358. return nil
  359. })
  360. return
  361. }
  362. func (v *Volume) ContentSize() uint64 {
  363. return v.nm.ContentSize()
  364. }