Browse Source
add leveldb support for needle map
add leveldb support for needle map
This is supposed to reduce memory consumption. However, in tests with millions of entries, it consumed more memory. Need to see whether this will work out. If not, boltdb will be tested later. pull/114/head
13 changed files with 347 additions and 253 deletions
-
158go/storage/needle_map.go
-
151go/storage/needle_map_leveldb.go
-
126go/storage/needle_map_memory.go
-
40go/storage/store.go
-
83go/storage/volume.go
-
4go/storage/volume_vacuum.go
-
4go/util/http_util.go
-
2go/weed/compact.go
-
4go/weed/fix.go
-
2go/weed/server.go
-
3go/weed/volume.go
-
10go/weed/weed_server/volume_server.go
-
13go/weed/weed_server/volume_server_handlers_admin.go
@ -0,0 +1,151 @@ |
|||||
|
package storage |
||||
|
|
||||
|
import ( |
||||
|
"fmt" |
||||
|
"os" |
||||
|
"path/filepath" |
||||
|
|
||||
|
"github.com/chrislusf/weed-fs/go/glog" |
||||
|
"github.com/chrislusf/weed-fs/go/util" |
||||
|
"github.com/syndtr/goleveldb/leveldb" |
||||
|
) |
||||
|
|
||||
|
type LevelDbNeedleMap struct { |
||||
|
dbFileName string |
||||
|
indexFile *os.File |
||||
|
db *leveldb.DB |
||||
|
mapMetric |
||||
|
} |
||||
|
|
||||
|
func NewLevelDbNeedleMap(dbFileName string, indexFile *os.File) (m *LevelDbNeedleMap, err error) { |
||||
|
m = &LevelDbNeedleMap{indexFile: indexFile, dbFileName: dbFileName} |
||||
|
if !isLevelDbFresh(dbFileName, indexFile) { |
||||
|
glog.V(1).Infof("Start to Generate %s from %s", dbFileName, indexFile.Name()) |
||||
|
generateDbFile(dbFileName, indexFile) |
||||
|
glog.V(1).Infof("Finished Generating %s from %s", dbFileName, indexFile.Name()) |
||||
|
} |
||||
|
glog.V(1).Infof("Opening %s...", dbFileName) |
||||
|
if m.db, err = leveldb.OpenFile(dbFileName, nil); err != nil { |
||||
|
return |
||||
|
} |
||||
|
glog.V(1).Infof("Loading %s...", indexFile.Name()) |
||||
|
nm, indexLoadError := LoadNeedleMap(indexFile) |
||||
|
if indexLoadError != nil { |
||||
|
return nil, indexLoadError |
||||
|
} |
||||
|
m.mapMetric = nm.mapMetric |
||||
|
return |
||||
|
} |
||||
|
|
||||
|
func isLevelDbFresh(dbFileName string, indexFile *os.File) bool { |
||||
|
// normally we always write to index file first
|
||||
|
dbLogFile, err := os.Open(filepath.Join(dbFileName, "LOG")) |
||||
|
if err != nil { |
||||
|
return false |
||||
|
} |
||||
|
defer dbLogFile.Close() |
||||
|
dbStat, dbStatErr := dbLogFile.Stat() |
||||
|
indexStat, indexStatErr := indexFile.Stat() |
||||
|
if dbStatErr != nil || indexStatErr != nil { |
||||
|
glog.V(0).Infof("Can not stat file: %v and %v", dbStatErr, indexStatErr) |
||||
|
return false |
||||
|
} |
||||
|
|
||||
|
return dbStat.ModTime().After(indexStat.ModTime()) |
||||
|
} |
||||
|
|
||||
|
func generateDbFile(dbFileName string, indexFile *os.File) error { |
||||
|
db, err := leveldb.OpenFile(dbFileName, nil) |
||||
|
if err != nil { |
||||
|
return err |
||||
|
} |
||||
|
defer db.Close() |
||||
|
return WalkIndexFile(indexFile, func(key uint64, offset, size uint32) error { |
||||
|
if offset > 0 { |
||||
|
levelDbWrite(db, key, offset, size) |
||||
|
} else { |
||||
|
levelDbDelete(db, key) |
||||
|
} |
||||
|
return nil |
||||
|
}) |
||||
|
} |
||||
|
|
||||
|
func (m *LevelDbNeedleMap) Get(key uint64) (element *NeedleValue, ok bool) { |
||||
|
bytes := make([]byte, 8) |
||||
|
util.Uint64toBytes(bytes, key) |
||||
|
data, err := m.db.Get(bytes, nil) |
||||
|
if err != nil || len(data) != 8 { |
||||
|
glog.V(0).Infof("Failed to get %d %v", key, err) |
||||
|
return nil, false |
||||
|
} |
||||
|
offset := util.BytesToUint32(data[0:4]) |
||||
|
size := util.BytesToUint32(data[4:8]) |
||||
|
return &NeedleValue{Key: Key(key), Offset: offset, Size: size}, true |
||||
|
} |
||||
|
|
||||
|
func (m *LevelDbNeedleMap) Put(key uint64, offset uint32, size uint32) error { |
||||
|
var oldSize uint32 |
||||
|
if oldNeedle, ok := m.Get(key); ok { |
||||
|
oldSize = oldNeedle.Size |
||||
|
} |
||||
|
m.logPut(key, oldSize, size) |
||||
|
// write to index file first
|
||||
|
if err := appendToIndexFile(m.indexFile, key, offset, size); err != nil { |
||||
|
return fmt.Errorf("cannot write to indexfile %s: %v", m.indexFile.Name(), err) |
||||
|
} |
||||
|
return levelDbWrite(m.db, key, offset, size) |
||||
|
} |
||||
|
|
||||
|
func levelDbWrite(db *leveldb.DB, |
||||
|
key uint64, offset uint32, size uint32) error { |
||||
|
bytes := make([]byte, 16) |
||||
|
util.Uint64toBytes(bytes[0:8], key) |
||||
|
util.Uint32toBytes(bytes[8:12], offset) |
||||
|
util.Uint32toBytes(bytes[12:16], size) |
||||
|
if err := db.Put(bytes[0:8], bytes[8:16], nil); err != nil { |
||||
|
return fmt.Errorf("failed to write leveldb: %v", err) |
||||
|
} |
||||
|
return nil |
||||
|
} |
||||
|
func levelDbDelete(db *leveldb.DB, key uint64) error { |
||||
|
bytes := make([]byte, 8) |
||||
|
util.Uint64toBytes(bytes, key) |
||||
|
return db.Delete(bytes, nil) |
||||
|
} |
||||
|
|
||||
|
func (m *LevelDbNeedleMap) Delete(key uint64) error { |
||||
|
if oldNeedle, ok := m.Get(key); ok { |
||||
|
m.logDelete(oldNeedle.Size) |
||||
|
} |
||||
|
// write to index file first
|
||||
|
if err := appendToIndexFile(m.indexFile, key, 0, 0); err != nil { |
||||
|
return err |
||||
|
} |
||||
|
return levelDbDelete(m.db, key) |
||||
|
} |
||||
|
|
||||
|
func (m *LevelDbNeedleMap) Close() { |
||||
|
m.db.Close() |
||||
|
} |
||||
|
|
||||
|
func (m *LevelDbNeedleMap) Destroy() error { |
||||
|
m.Close() |
||||
|
os.Remove(m.indexFile.Name()) |
||||
|
return os.Remove(m.dbFileName) |
||||
|
} |
||||
|
|
||||
|
func (m *LevelDbNeedleMap) ContentSize() uint64 { |
||||
|
return m.FileByteCounter |
||||
|
} |
||||
|
func (m *LevelDbNeedleMap) DeletedSize() uint64 { |
||||
|
return m.DeletionByteCounter |
||||
|
} |
||||
|
func (m *LevelDbNeedleMap) FileCount() int { |
||||
|
return m.FileCounter |
||||
|
} |
||||
|
func (m *LevelDbNeedleMap) DeletedCount() int { |
||||
|
return m.DeletionCounter |
||||
|
} |
||||
|
func (m *LevelDbNeedleMap) MaxFileKey() uint64 { |
||||
|
return m.MaximumFileKey |
||||
|
} |
@ -0,0 +1,126 @@ |
|||||
|
package storage |
||||
|
|
||||
|
import ( |
||||
|
"io" |
||||
|
"os" |
||||
|
|
||||
|
"github.com/chrislusf/weed-fs/go/glog" |
||||
|
"github.com/chrislusf/weed-fs/go/util" |
||||
|
) |
||||
|
|
||||
|
type NeedleMap struct { |
||||
|
indexFile *os.File |
||||
|
m CompactMap |
||||
|
|
||||
|
mapMetric |
||||
|
} |
||||
|
|
||||
|
func NewNeedleMap(file *os.File) *NeedleMap { |
||||
|
nm := &NeedleMap{ |
||||
|
m: NewCompactMap(), |
||||
|
indexFile: file, |
||||
|
} |
||||
|
return nm |
||||
|
} |
||||
|
|
||||
|
// RowsToRead is the number of 16-byte index entries WalkIndexFile reads per
// ReadAt call.
const RowsToRead = 1024
||||
|
|
||||
|
func LoadNeedleMap(file *os.File) (*NeedleMap, error) { |
||||
|
nm := NewNeedleMap(file) |
||||
|
e := WalkIndexFile(file, func(key uint64, offset, size uint32) error { |
||||
|
if key > nm.MaximumFileKey { |
||||
|
nm.MaximumFileKey = key |
||||
|
} |
||||
|
nm.FileCounter++ |
||||
|
nm.FileByteCounter = nm.FileByteCounter + uint64(size) |
||||
|
if offset > 0 { |
||||
|
oldSize := nm.m.Set(Key(key), offset, size) |
||||
|
glog.V(3).Infoln("reading key", key, "offset", offset*NeedlePaddingSize, "size", size, "oldSize", oldSize) |
||||
|
if oldSize > 0 { |
||||
|
nm.DeletionCounter++ |
||||
|
nm.DeletionByteCounter = nm.DeletionByteCounter + uint64(oldSize) |
||||
|
} |
||||
|
} else { |
||||
|
oldSize := nm.m.Delete(Key(key)) |
||||
|
glog.V(3).Infoln("removing key", key, "offset", offset*NeedlePaddingSize, "size", size, "oldSize", oldSize) |
||||
|
nm.DeletionCounter++ |
||||
|
nm.DeletionByteCounter = nm.DeletionByteCounter + uint64(oldSize) |
||||
|
} |
||||
|
return nil |
||||
|
}) |
||||
|
glog.V(1).Infoln("max file key:", nm.MaximumFileKey) |
||||
|
return nm, e |
||||
|
} |
||||
|
|
||||
|
// walks through the index file, calls fn function with each key, offset, size
|
||||
|
// stops with the error returned by the fn function
|
||||
|
func WalkIndexFile(r *os.File, fn func(key uint64, offset, size uint32) error) error { |
||||
|
var readerOffset int64 |
||||
|
bytes := make([]byte, 16*RowsToRead) |
||||
|
count, e := r.ReadAt(bytes, readerOffset) |
||||
|
glog.V(3).Infoln("file", r.Name(), "readerOffset", readerOffset, "count", count, "e", e) |
||||
|
readerOffset += int64(count) |
||||
|
var ( |
||||
|
key uint64 |
||||
|
offset, size uint32 |
||||
|
i int |
||||
|
) |
||||
|
|
||||
|
for count > 0 && e == nil || e == io.EOF { |
||||
|
for i = 0; i+16 <= count; i += 16 { |
||||
|
key = util.BytesToUint64(bytes[i : i+8]) |
||||
|
offset = util.BytesToUint32(bytes[i+8 : i+12]) |
||||
|
size = util.BytesToUint32(bytes[i+12 : i+16]) |
||||
|
if e = fn(key, offset, size); e != nil { |
||||
|
return e |
||||
|
} |
||||
|
} |
||||
|
if e == io.EOF { |
||||
|
return nil |
||||
|
} |
||||
|
count, e = r.ReadAt(bytes, readerOffset) |
||||
|
glog.V(3).Infoln("file", r.Name(), "readerOffset", readerOffset, "count", count, "e", e) |
||||
|
readerOffset += int64(count) |
||||
|
} |
||||
|
return e |
||||
|
} |
||||
|
|
||||
|
func (nm *NeedleMap) Put(key uint64, offset uint32, size uint32) error { |
||||
|
oldSize := nm.m.Set(Key(key), offset, size) |
||||
|
nm.logPut(key, oldSize, size) |
||||
|
return appendToIndexFile(nm.indexFile, key, offset, size) |
||||
|
} |
||||
|
func (nm *NeedleMap) Get(key uint64) (element *NeedleValue, ok bool) { |
||||
|
element, ok = nm.m.Get(Key(key)) |
||||
|
return |
||||
|
} |
||||
|
func (nm *NeedleMap) Delete(key uint64) error { |
||||
|
deletedBytes := nm.m.Delete(Key(key)) |
||||
|
nm.logDelete(deletedBytes) |
||||
|
return appendToIndexFile(nm.indexFile, key, 0, 0) |
||||
|
} |
||||
|
func (nm *NeedleMap) Close() { |
||||
|
_ = nm.indexFile.Close() |
||||
|
} |
||||
|
func (nm *NeedleMap) Destroy() error { |
||||
|
nm.Close() |
||||
|
return os.Remove(nm.indexFile.Name()) |
||||
|
} |
||||
|
func (nm NeedleMap) ContentSize() uint64 { |
||||
|
return nm.FileByteCounter |
||||
|
} |
||||
|
func (nm NeedleMap) DeletedSize() uint64 { |
||||
|
return nm.DeletionByteCounter |
||||
|
} |
||||
|
func (nm NeedleMap) FileCount() int { |
||||
|
return nm.FileCounter |
||||
|
} |
||||
|
func (nm NeedleMap) DeletedCount() int { |
||||
|
return nm.DeletionCounter |
||||
|
} |
||||
|
|
||||
|
func (nm NeedleMap) MaxFileKey() uint64 { |
||||
|
return nm.MaximumFileKey |
||||
|
} |
Write
Preview
Loading…
Cancel
Save
Reference in new issue