You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
144 lines
4.6 KiB
144 lines
4.6 KiB
package shell
|
|
|
|
import (
|
|
"context"
|
|
"flag"
|
|
"fmt"
|
|
"io"
|
|
"time"
|
|
|
|
"github.com/seaweedfs/seaweedfs/weed/pb/master_pb"
|
|
)
|
|
|
|
func init() {
|
|
Commands = append(Commands, &commandRaftLeaderTransfer{})
|
|
}
|
|
|
|
type commandRaftLeaderTransfer struct{}
|
|
|
|
func (c *commandRaftLeaderTransfer) Name() string {
|
|
return "cluster.raft.transferLeader"
|
|
}
|
|
|
|
func (c *commandRaftLeaderTransfer) Help() string {
|
|
return `transfer raft leadership to another master server
|
|
|
|
This command initiates a graceful leadership transfer from the current
|
|
leader to another server. Use this before performing maintenance on
|
|
the current leader to reduce errors in filers and other components.
|
|
|
|
Examples:
|
|
# Transfer to any eligible follower (auto-selection)
|
|
cluster.raft.transferLeader
|
|
|
|
# Transfer to a specific server
|
|
cluster.raft.transferLeader -id <server_id> -address <server_grpc_address>
|
|
|
|
Notes:
|
|
- Requires hashicorp raft (-raftHashicorp=true on master)
|
|
- This command must be sent to the current leader
|
|
- The target server must be a voting member of the raft cluster
|
|
- Use 'cluster.raft.ps' to list available servers and identify the leader
|
|
`
|
|
}
|
|
|
|
func (c *commandRaftLeaderTransfer) HasTag(CommandTag) bool {
|
|
return false
|
|
}
|
|
|
|
func (c *commandRaftLeaderTransfer) Do(args []string, commandEnv *CommandEnv, writer io.Writer) error {
|
|
leaderTransferCommand := flag.NewFlagSet(c.Name(), flag.ContinueOnError)
|
|
targetId := leaderTransferCommand.String("id", "", "target server id (must be used with -address)")
|
|
targetAddress := leaderTransferCommand.String("address", "", "target server grpc address (must be used with -id)")
|
|
|
|
if err := leaderTransferCommand.Parse(args); err != nil {
|
|
return err
|
|
}
|
|
|
|
// Validate: id and address must be specified together
|
|
if *targetId != "" && *targetAddress == "" {
|
|
return fmt.Errorf("-address is required when -id is specified")
|
|
}
|
|
if *targetAddress != "" && *targetId == "" {
|
|
return fmt.Errorf("-id is required when -address is specified")
|
|
}
|
|
|
|
// First, show current cluster status
|
|
fmt.Fprintf(writer, "Checking current raft cluster status...\n")
|
|
|
|
var currentLeader string
|
|
err := commandEnv.MasterClient.WithClient(false, func(client master_pb.SeaweedClient) error {
|
|
ctx, cancel := context.WithTimeout(context.Background(), 10*time.Second)
|
|
defer cancel()
|
|
|
|
resp, err := client.RaftListClusterServers(ctx, &master_pb.RaftListClusterServersRequest{})
|
|
if err != nil {
|
|
return fmt.Errorf("failed to list cluster servers: %v", err)
|
|
}
|
|
|
|
if len(resp.ClusterServers) == 0 {
|
|
fmt.Fprintf(writer, "No raft cluster configured (single master mode)\n")
|
|
return fmt.Errorf("leadership transfer not available in single master mode")
|
|
}
|
|
|
|
fmt.Fprintf(writer, "Raft cluster has %d servers:\n", len(resp.ClusterServers))
|
|
for _, server := range resp.ClusterServers {
|
|
suffix := ""
|
|
if server.IsLeader {
|
|
suffix = " <- current leader"
|
|
currentLeader = server.Id
|
|
}
|
|
fmt.Fprintf(writer, " %s %s [%s]%s\n", server.Id, server.Address, server.Suffrage, suffix)
|
|
}
|
|
return nil
|
|
})
|
|
if err != nil {
|
|
return err
|
|
}
|
|
|
|
if currentLeader == "" {
|
|
return fmt.Errorf("no leader found in cluster")
|
|
}
|
|
|
|
// Perform the transfer
|
|
targetDesc := "any eligible follower"
|
|
if *targetId != "" {
|
|
targetDesc = fmt.Sprintf("server %s (%s)", *targetId, *targetAddress)
|
|
}
|
|
fmt.Fprintf(writer, "\nTransferring leadership from %s to %s...\n", currentLeader, targetDesc)
|
|
|
|
err = commandEnv.MasterClient.WithClient(true, func(client master_pb.SeaweedClient) error {
|
|
ctx, cancel := context.WithTimeout(context.Background(), 30*time.Second)
|
|
defer cancel()
|
|
|
|
resp, err := client.RaftLeadershipTransfer(ctx, &master_pb.RaftLeadershipTransferRequest{
|
|
TargetId: *targetId,
|
|
TargetAddress: *targetAddress,
|
|
})
|
|
if err != nil {
|
|
return fmt.Errorf("leadership transfer failed: %v", err)
|
|
}
|
|
|
|
if resp.PreviousLeader != resp.NewLeader {
|
|
fmt.Fprintf(writer, "Leadership successfully transferred.\n")
|
|
fmt.Fprintf(writer, " Previous leader: %s\n", resp.PreviousLeader)
|
|
fmt.Fprintf(writer, " New leader: %s\n", resp.NewLeader)
|
|
} else {
|
|
fmt.Fprintf(writer, "Leadership transfer initiated, but the same leader was re-elected.\n")
|
|
fmt.Fprintf(writer, " Current leader: %s\n", resp.NewLeader)
|
|
}
|
|
return nil
|
|
})
|
|
|
|
if err != nil {
|
|
fmt.Fprintf(writer, "\nLeadership transfer failed: %v\n", err)
|
|
fmt.Fprintf(writer, "\nTroubleshooting:\n")
|
|
fmt.Fprintf(writer, " - Ensure you are connected to the current leader\n")
|
|
fmt.Fprintf(writer, " - Ensure target server is a voting member (use 'cluster.raft.ps')\n")
|
|
fmt.Fprintf(writer, " - Ensure target server is healthy and reachable\n")
|
|
return err
|
|
}
|
|
|
|
return nil
|
|
}
|
|
|