Browse Source
Fix LevelDB panic on lazy reload (#8269) (#8307)
Fix LevelDB panic on lazy reload (#8269) (#8307)
* fix LevelDB panic on lazy reload Implemented a thread-safe reload mechanism using double-checked locking and a retry loop in Get, Put, and Delete. Added a concurrency test to verify the fix and prevent regressions. Fixes #8269 * refactor: use helper for leveldb fix and remove deprecated ioutil * fix: prevent deadlock by using getFromDb helper Extracted DB lookup to internal helper to avoid recursive RLock in Put/Delete methods. Updated Get to use the helper as well. * fix: resolve syntax error and commit deadlock prevention Fixed a duplicate function declaration syntax error. Verified that getFromDb helper correctly prevents recursive RLock scenarios. * refactor: remove redundant timeout checks Removed nested `if m.ldbTimeout > 0` checks in Get, Put, and Delete methods as suggested in PR review.pull/8323/head
committed by
GitHub
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
2 changed files with 123 additions and 17 deletions
@ -0,0 +1,90 @@ |
|||
package storage |
|||
|
|||
import ( |
|||
"fmt" |
|||
"os" |
|||
"path/filepath" |
|||
"sync" |
|||
"testing" |
|||
|
|||
"github.com/seaweedfs/seaweedfs/weed/storage/types" |
|||
) |
|||
|
|||
func TestLevelDbNeedleMap_Concurrency(t *testing.T) { |
|||
dir, err := os.MkdirTemp("", "test_leveldb_concurrency") |
|||
if err != nil { |
|||
t.Fatalf("temp dir: %v", err) |
|||
} |
|||
defer os.RemoveAll(dir) |
|||
|
|||
prefix := "test" |
|||
indexFile, err := os.Create(filepath.Join(dir, prefix+".idx")) |
|||
if err != nil { |
|||
t.Fatalf("create index file: %v", err) |
|||
} |
|||
dbFileName := filepath.Join(dir, prefix+".ldb") |
|||
|
|||
// Create and initialize map
|
|||
m, err := NewLevelDbNeedleMap(dbFileName, indexFile, nil, 1) |
|||
if err != nil { |
|||
t.Fatalf("NewLevelDbNeedleMap: %v", err) |
|||
} |
|||
defer m.Close() |
|||
|
|||
// Pre-populate some data
|
|||
key := types.NeedleId(1) |
|||
if err := m.Put(key, types.ToOffset(100), types.Size(200)); err != nil { |
|||
t.Fatalf("Put: %v", err) |
|||
} |
|||
|
|||
// Force unload to start from nil state
|
|||
if err := unloadLdb(m); err != nil { |
|||
t.Fatalf("unloadLdb: %v", err) |
|||
} |
|||
|
|||
var wg sync.WaitGroup |
|||
startCh := make(chan struct{}) |
|||
errCh := make(chan error, 100) |
|||
|
|||
// Spawn multiple goroutines to trigger the race
|
|||
// Multiple readers will see m.db == nil and try to reload concurrently
|
|||
for i := 0; i < 2; i++ { |
|||
wg.Add(1) |
|||
go func(id int) { |
|||
defer wg.Done() |
|||
<-startCh |
|||
|
|||
// Try multiple times to increase chance of collision
|
|||
for j := 0; j < 2; j++ { |
|||
_, ok := m.Get(key) |
|||
if !ok { |
|||
// Get failed, possibly due to race in reload.
|
|||
// But we also put data concurrently, so maybe it's missing if deleted?
|
|||
// In this test, we only Put, never Delete. So Key 1 should be there.
|
|||
// However, if DB reload fails, Get returns false!
|
|||
errCh <- fmt.Errorf("routine %d iter %d: Get returned false", id, j) |
|||
} |
|||
|
|||
// Also try Put concurrently
|
|||
err := m.Put(types.NeedleId(2+id), types.ToOffset(100), types.Size(200)) |
|||
if err != nil { |
|||
errCh <- fmt.Errorf("routine %d iter %d: Put failed: %v", id, j, err) |
|||
} |
|||
|
|||
// Manually unload occasionally to reset the state
|
|||
if j%2 == 0 { |
|||
// This might fail if locked, but that's fine
|
|||
unloadLdb(m) |
|||
} |
|||
} |
|||
}(i) |
|||
} |
|||
|
|||
close(startCh) |
|||
wg.Wait() |
|||
close(errCh) |
|||
|
|||
for e := range errCh { |
|||
t.Errorf("Error encountered: %v", e) |
|||
} |
|||
} |
|||
Write
Preview
Loading…
Cancel
Save
Reference in new issue