You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
234 lines
7.7 KiB
234 lines
7.7 KiB
package command
|
|
|
|
import (
|
|
"context"
|
|
"fmt"
|
|
|
|
"google.golang.org/grpc"
|
|
|
|
"github.com/seaweedfs/seaweedfs/weed/pb"
|
|
|
|
"github.com/seaweedfs/seaweedfs/weed/security"
|
|
"github.com/seaweedfs/seaweedfs/weed/storage/needle"
|
|
"github.com/seaweedfs/seaweedfs/weed/storage/super_block"
|
|
"github.com/seaweedfs/seaweedfs/weed/util"
|
|
|
|
"github.com/seaweedfs/seaweedfs/weed/operation"
|
|
"github.com/seaweedfs/seaweedfs/weed/storage"
|
|
)
|
|
|
|
var (
|
|
s BackupOptions
|
|
)
|
|
|
|
// BackupOptions groups the command-line flag values used by the backup command.
// Every field is a pointer so it can be bound directly to a registered flag.
type BackupOptions struct {
	// master is the SeaweedFS master location.
	master *string
	// server is the older spelling of master.
	// deprecated, for backward compatibility
	server *string
	// collection is the collection name.
	collection *string
	// dir is the directory to store volume data files.
	dir *string
	// volumeId is the id of the volume to back up.
	volumeId *int
	// ttl is the backup volume's time to live.
	ttl *string
	// replication is the backup volume's replication.
	replication *string
}
|
|
|
|
func init() {
|
|
cmdBackup.Run = runBackup // break init cycle
|
|
s.master = cmdBackup.Flag.String("master", "localhost:9333", "SeaweedFS master location")
|
|
s.server = cmdBackup.Flag.String("server", "", "SeaweedFS master location (deprecated, use -master instead)")
|
|
s.collection = cmdBackup.Flag.String("collection", "", "collection name")
|
|
s.dir = cmdBackup.Flag.String("dir", ".", "directory to store volume data files")
|
|
s.volumeId = cmdBackup.Flag.Int("volumeId", -1, "a volume id. The volume .dat and .idx files should already exist in the dir.")
|
|
s.ttl = cmdBackup.Flag.String("ttl", "", `backup volume's time to live, format:
|
|
3m: 3 minutes
|
|
4h: 4 hours
|
|
5d: 5 days
|
|
6w: 6 weeks
|
|
7M: 7 months
|
|
8y: 8 years
|
|
default is the same with origin`)
|
|
s.replication = cmdBackup.Flag.String("replication", "", "backup volume's replication, default is the same with origin")
|
|
}
|
|
|
|
var cmdBackup = &Command{
|
|
UsageLine: "backup -dir=. -volumeId=234 -master=localhost:9333",
|
|
Short: "incrementally backup a volume to local folder",
|
|
Long: `Incrementally backup volume data.
|
|
|
|
It is expected that you use this inside a script, to loop through
|
|
all possible volume ids that needs to be backup to local folder.
|
|
|
|
The volume id does not need to exist locally or even remotely.
|
|
This will help to backup future new volumes.
|
|
|
|
Usually backing up is just copying the .dat (and .idx) files.
|
|
But it's tricky to incrementally copy the differences.
|
|
|
|
The complexity comes when there are multiple addition, deletion and compaction.
|
|
This tool will handle them correctly and efficiently, avoiding unnecessary data transportation.
|
|
`,
|
|
}
|
|
|
|
// parseTTL parses the TTL from user input or volume stats.
|
|
// Returns (ttl, error, isFatal) where isFatal=true for invalid user input.
|
|
func parseTTL(userTTL string, statsTTL string) (*needle.TTL, error, bool) {
|
|
if userTTL != "" {
|
|
ttl, err := needle.ReadTTL(userTTL)
|
|
if err != nil {
|
|
// User-provided TTL is invalid - this is fatal
|
|
return nil, fmt.Errorf("invalid user-provided ttl %s: %w", userTTL, err), true
|
|
}
|
|
return ttl, nil, false
|
|
}
|
|
|
|
ttl, err := needle.ReadTTL(statsTTL)
|
|
if err != nil {
|
|
return nil, fmt.Errorf("parsing ttl %s from stats: %w", statsTTL, err), false
|
|
}
|
|
return ttl, nil, false
|
|
}
|
|
|
|
// parseReplication parses the replication from user input or volume stats.
|
|
// Returns (replication, error, isFatal) where isFatal=true for invalid user input.
|
|
func parseReplication(userReplication string, statsReplication string) (*super_block.ReplicaPlacement, error, bool) {
|
|
if userReplication != "" {
|
|
replication, err := super_block.NewReplicaPlacementFromString(userReplication)
|
|
if err != nil {
|
|
// User-provided replication is invalid - this is fatal
|
|
return nil, fmt.Errorf("invalid user-provided replication %s: %w", userReplication, err), true
|
|
}
|
|
return replication, nil, false
|
|
}
|
|
|
|
replication, err := super_block.NewReplicaPlacementFromString(statsReplication)
|
|
if err != nil {
|
|
return nil, fmt.Errorf("parsing replication %s from stats: %w", statsReplication, err), false
|
|
}
|
|
return replication, nil, false
|
|
}
|
|
|
|
// backupFromLocation attempts to backup a volume from a specific volume server location.
|
|
// Returns (error, isFatal) where isFatal=true means the error is due to invalid user input
|
|
// and should not be retried with other locations.
|
|
func backupFromLocation(volumeServer pb.ServerAddress, grpcDialOption grpc.DialOption, vid needle.VolumeId) (error, bool) {
|
|
stats, err := operation.GetVolumeSyncStatus(volumeServer, grpcDialOption, uint32(vid))
|
|
if err != nil {
|
|
return fmt.Errorf("getting volume status: %w", err), false
|
|
}
|
|
|
|
// Parse TTL
|
|
ttl, err, isFatal := parseTTL(*s.ttl, stats.Ttl)
|
|
if err != nil {
|
|
return err, isFatal
|
|
}
|
|
|
|
// Parse replication
|
|
replication, err, isFatal := parseReplication(*s.replication, stats.Replication)
|
|
if err != nil {
|
|
return err, isFatal
|
|
}
|
|
|
|
ver := needle.Version(stats.Version)
|
|
|
|
// Create or load the volume
|
|
v, err := storage.NewVolume(util.ResolvePath(*s.dir), util.ResolvePath(*s.dir), *s.collection, vid, storage.NeedleMapInMemory, replication, ttl, 0, ver, 0, 0)
|
|
if err != nil {
|
|
return fmt.Errorf("creating or reading volume: %w", err), false
|
|
}
|
|
|
|
// Handle compaction if needed
|
|
if v.SuperBlock.CompactionRevision < uint16(stats.CompactRevision) {
|
|
if err = v.Compact2(0, 0, nil); err != nil {
|
|
v.Close()
|
|
return fmt.Errorf("compacting volume: %w", err), false
|
|
}
|
|
if err = v.CommitCompact(); err != nil {
|
|
v.Close()
|
|
return fmt.Errorf("committing compaction: %w", err), false
|
|
}
|
|
v.SuperBlock.CompactionRevision = uint16(stats.CompactRevision)
|
|
if _, err = v.DataBackend.WriteAt(v.SuperBlock.Bytes(), 0); err != nil {
|
|
v.Close()
|
|
return fmt.Errorf("writing superblock: %w", err), false
|
|
}
|
|
}
|
|
|
|
datSize, _, _ := v.FileStat()
|
|
|
|
// If local volume is larger than remote, recreate it
|
|
if datSize > stats.TailOffset {
|
|
if err := v.Destroy(false); err != nil {
|
|
v.Close()
|
|
return fmt.Errorf("destroying volume: %w", err), false
|
|
}
|
|
v.Close() // Close the destroyed volume
|
|
// recreate an empty volume
|
|
v, err = storage.NewVolume(util.ResolvePath(*s.dir), util.ResolvePath(*s.dir), *s.collection, vid, storage.NeedleMapInMemory, replication, ttl, 0, ver, 0, 0)
|
|
if err != nil {
|
|
return fmt.Errorf("recreating volume: %w", err), false
|
|
}
|
|
}
|
|
|
|
// Perform the incremental backup
|
|
if err := v.IncrementalBackup(volumeServer, grpcDialOption); err != nil {
|
|
v.Close()
|
|
return fmt.Errorf("incremental backup: %w", err), false
|
|
}
|
|
|
|
v.Close()
|
|
return nil, false
|
|
}
|
|
|
|
func runBackup(cmd *Command, args []string) bool {
|
|
|
|
util.LoadSecurityConfiguration()
|
|
grpcDialOption := security.LoadClientTLS(util.GetViper(), "grpc.client")
|
|
|
|
// Backward compatibility: if -server is provided, use it
|
|
masterServer := *s.master
|
|
if *s.server != "" {
|
|
masterServer = *s.server
|
|
}
|
|
|
|
if *s.volumeId == -1 {
|
|
return false
|
|
}
|
|
vid := needle.VolumeId(*s.volumeId)
|
|
|
|
// find volume location, replication, ttl info
|
|
lookup, err := operation.LookupVolumeId(func(_ context.Context) pb.ServerAddress { return pb.ServerAddress(masterServer) }, grpcDialOption, vid.String())
|
|
if err != nil {
|
|
fmt.Printf("Error looking up volume %d: %v\n", vid, err)
|
|
return true
|
|
}
|
|
if len(lookup.Locations) == 0 {
|
|
fmt.Printf("Error: volume %d has no locations available\n", vid)
|
|
return true
|
|
}
|
|
|
|
// Try each available location until one succeeds
|
|
var lastErr error
|
|
for i, location := range lookup.Locations {
|
|
volumeServer := location.ServerAddress()
|
|
fmt.Printf("Attempting to backup volume %d from location %d/%d: %s\n", vid, i+1, len(lookup.Locations), volumeServer)
|
|
|
|
err, isFatal := backupFromLocation(volumeServer, grpcDialOption, vid)
|
|
if err != nil {
|
|
fmt.Printf("Error backing up volume %d from %s: %v\n", vid, volumeServer, err)
|
|
lastErr = err
|
|
// Check if this is a fatal user-input error
|
|
if isFatal {
|
|
return true
|
|
}
|
|
continue
|
|
}
|
|
|
|
// Success!
|
|
fmt.Printf("Successfully backed up volume %d from %s\n", vid, volumeServer)
|
|
return true
|
|
}
|
|
|
|
// All locations failed
|
|
fmt.Printf("Failed to backup volume %d after trying all %d locations. Last error: %v\n", vid, len(lookup.Locations), lastErr)
|
|
|
|
return true
|
|
}
|