package replication
import "fmt"
// === Phase 06: Execution Driver ===
//
// Convenience flow classification (Phase 06 P0):
//
//	ProcessAssignment → stepwise engine task (real entry point)
//	ExecuteRecovery   → planner (connect + classify outcome)
//	CompleteCatchUp   → TEST-ONLY convenience (bundles plan+execute+complete)
//	CompleteRebuild   → TEST-ONLY convenience (bundles plan+execute+complete)
//	UpdateSenderEpoch → stepwise engine task
//	InvalidateEpoch   → stepwise engine task
//
// The real engine flow splits catch-up and rebuild into:
//
//	1. Plan: acquire resources (pin WAL or snapshot)
//	2. Execute: stream entries stepwise (not one-shot)
//	3. Complete: release resources, transition to InSync
//
// RecoveryDriver is the Phase 06 replacement for the synchronous
// convenience helpers. It plans, acquires resources, and provides
// a stepwise execution interface.

// RecoveryPlan represents a planned recovery operation with acquired resources.
// The executor consumes this plan — it does not re-derive policy.
//
// All targets are bound at plan time from the retained history; a plan that
// has gone stale should be cancelled via CancelPlan, which releases the pins.
type RecoveryPlan struct {
	ReplicaID string               // replica this plan was created for
	SessionID uint64               // session the plan is bound to; a newer session invalidates the plan
	Outcome   RecoveryOutcome      // classification produced by ExecuteRecovery
	Proof     *RecoverabilityProof // evidence backing the outcome classification

	// Resource pins (non-nil when resources are acquired).
	// ReleasePlan returns each non-nil pin to the storage adapter.
	RetentionPin *RetentionPin // for catch-up or snapshot+tail rebuild
	SnapshotPin  *SnapshotPin  // for snapshot+tail rebuild
	FullBasePin  *FullBasePin  // for full-base rebuild

	// Catch-up targets (bound at plan time).
	CatchUpTarget uint64 // for catch-up: committed LSN at plan time
	TruncateLSN   uint64 // non-zero if truncation required

	// Rebuild targets (bound at plan time).
	RebuildSource      RebuildSource // snapshot+tail vs. full-base, per RebuildSourceDecision
	RebuildSnapshotLSN uint64        // for snapshot+tail: the snapshot LSN
	RebuildTargetLSN   uint64        // committed LSN at plan time
}
// RecoveryDriver plans and executes recovery operations using real
// storage adapter inputs. It replaces the synchronous convenience
// helpers (CompleteCatchUp, CompleteRebuild) with a resource-aware,
// stepwise execution model.
type RecoveryDriver struct {
	Orchestrator *RecoveryOrchestrator // sender registry, event log, and outcome classification
	Storage      StorageAdapter        // source of retained history and of WAL/snapshot/full-base pins
}
// NewRecoveryDriver creates a driver with a fresh orchestrator.
|
|
func NewRecoveryDriver(storage StorageAdapter) *RecoveryDriver {
|
|
return &RecoveryDriver{
|
|
Orchestrator: NewRecoveryOrchestrator(),
|
|
Storage: storage,
|
|
}
|
|
}
// PlanRecovery connects, handshakes from real storage state, classifies
|
|
// the outcome, and acquires the necessary resources (WAL pin or snapshot pin).
|
|
// Returns a RecoveryPlan that the caller can execute stepwise.
|
|
func (d *RecoveryDriver) PlanRecovery(replicaID string, replicaFlushedLSN uint64) (*RecoveryPlan, error) {
|
|
history := d.Storage.GetRetainedHistory()
|
|
|
|
result := d.Orchestrator.ExecuteRecovery(replicaID, replicaFlushedLSN, &history)
|
|
if result.Error != nil {
|
|
return nil, result.Error
|
|
}
|
|
|
|
s := d.Orchestrator.Registry.Sender(replicaID)
|
|
plan := &RecoveryPlan{
|
|
ReplicaID: replicaID,
|
|
SessionID: s.SessionID(),
|
|
Outcome: result.Outcome,
|
|
Proof: result.Proof,
|
|
}
|
|
|
|
switch result.Outcome {
|
|
case OutcomeZeroGap:
|
|
// Already completed by ExecuteRecovery.
|
|
return plan, nil
|
|
|
|
case OutcomeCatchUp:
|
|
plan.CatchUpTarget = history.CommittedLSN
|
|
|
|
// Check if truncation is needed (replica ahead).
|
|
proof := history.ProveRecoverability(replicaFlushedLSN)
|
|
if proof.Reason == "replica_ahead_needs_truncation" {
|
|
plan.TruncateLSN = history.CommittedLSN
|
|
// Truncation-only: no WAL replay needed. No pin required.
|
|
d.Orchestrator.Log.Record(replicaID, plan.SessionID, "plan_truncate_only",
|
|
fmt.Sprintf("truncate_to=%d", plan.TruncateLSN))
|
|
return plan, nil
|
|
}
|
|
|
|
// Real catch-up: pin WAL from the session's actual replay start.
|
|
// The replay start is replicaFlushedLSN (where the replica left off).
|
|
replayStart := replicaFlushedLSN
|
|
pin, err := d.Storage.PinWALRetention(replayStart)
|
|
if err != nil {
|
|
s.InvalidateSession("wal_pin_failed", StateDisconnected)
|
|
d.Orchestrator.Log.Record(replicaID, plan.SessionID, "wal_pin_failed", err.Error())
|
|
return nil, fmt.Errorf("WAL retention pin failed: %w", err)
|
|
}
|
|
plan.RetentionPin = &pin
|
|
|
|
d.Orchestrator.Log.Record(replicaID, plan.SessionID, "plan_catchup",
|
|
fmt.Sprintf("replay=%d→%d pin=%d", replayStart, plan.CatchUpTarget, pin.PinID))
|
|
return plan, nil
|
|
|
|
case OutcomeNeedsRebuild:
|
|
// No resource acquisition — needs rebuild assignment first.
|
|
return plan, nil
|
|
}
|
|
|
|
return plan, nil
|
|
}
// PlanRebuild acquires rebuild resources (snapshot pin + optional WAL pin)
|
|
// from real storage state. Called after a rebuild assignment.
|
|
// Fails closed on: missing sender, no active session, non-rebuild session.
|
|
func (d *RecoveryDriver) PlanRebuild(replicaID string) (*RecoveryPlan, error) {
|
|
s := d.Orchestrator.Registry.Sender(replicaID)
|
|
if s == nil {
|
|
return nil, fmt.Errorf("sender %q not found", replicaID)
|
|
}
|
|
sessID := s.SessionID()
|
|
if sessID == 0 {
|
|
return nil, fmt.Errorf("no active session for %q", replicaID)
|
|
}
|
|
snap := s.SessionSnapshot()
|
|
if snap == nil || snap.Kind != SessionRebuild {
|
|
return nil, fmt.Errorf("session for %q is not a rebuild session (kind=%s)", replicaID, snap.Kind)
|
|
}
|
|
|
|
history := d.Storage.GetRetainedHistory()
|
|
source, snapLSN := history.RebuildSourceDecision()
|
|
|
|
plan := &RecoveryPlan{
|
|
ReplicaID: replicaID,
|
|
SessionID: sessID,
|
|
Outcome: OutcomeNeedsRebuild,
|
|
RebuildSource: source,
|
|
RebuildSnapshotLSN: snapLSN,
|
|
RebuildTargetLSN: history.CommittedLSN,
|
|
}
|
|
|
|
if source == RebuildSnapshotTail {
|
|
// Pin snapshot.
|
|
snapPin, err := d.Storage.PinSnapshot(snapLSN)
|
|
if err != nil {
|
|
s.InvalidateSession("snapshot_pin_failed", StateNeedsRebuild)
|
|
d.Orchestrator.Log.Record(replicaID, plan.SessionID, "snapshot_pin_failed", err.Error())
|
|
return nil, fmt.Errorf("snapshot pin failed: %w", err)
|
|
}
|
|
plan.SnapshotPin = &snapPin
|
|
|
|
// Pin WAL retention for tail replay.
|
|
retPin, err := d.Storage.PinWALRetention(snapLSN)
|
|
if err != nil {
|
|
d.Storage.ReleaseSnapshot(snapPin)
|
|
s.InvalidateSession("wal_pin_failed_during_rebuild", StateNeedsRebuild)
|
|
d.Orchestrator.Log.Record(replicaID, plan.SessionID, "wal_pin_failed", err.Error())
|
|
return nil, fmt.Errorf("WAL retention pin failed: %w", err)
|
|
}
|
|
plan.RetentionPin = &retPin
|
|
|
|
d.Orchestrator.Log.Record(replicaID, plan.SessionID, "plan_rebuild_snapshot_tail",
|
|
fmt.Sprintf("snapshot=%d", snapLSN))
|
|
} else {
|
|
// Full-base rebuild: pin a consistent full-extent base image.
|
|
basePin, err := d.Storage.PinFullBase(history.CommittedLSN)
|
|
if err != nil {
|
|
// Fail closed: invalidate session so sender is not left dangling.
|
|
s.InvalidateSession("full_base_pin_failed", StateNeedsRebuild)
|
|
d.Orchestrator.Log.Record(replicaID, plan.SessionID, "full_base_pin_failed", err.Error())
|
|
return nil, fmt.Errorf("full base pin failed: %w", err)
|
|
}
|
|
plan.FullBasePin = &basePin
|
|
|
|
// Log causal reason for full-base selection.
|
|
reason := "no_checkpoint"
|
|
if history.CheckpointLSN > 0 && !history.CheckpointTrusted {
|
|
reason = "untrusted_checkpoint"
|
|
} else if history.CheckpointTrusted && !history.IsRecoverable(history.CheckpointLSN, history.CommittedLSN) {
|
|
reason = fmt.Sprintf("trusted_checkpoint_unreplayable_tail: checkpoint=%d tail=%d",
|
|
history.CheckpointLSN, history.TailLSN)
|
|
}
|
|
d.Orchestrator.Log.Record(replicaID, plan.SessionID, "plan_rebuild_full_base",
|
|
fmt.Sprintf("reason=%s committed=%d", reason, history.CommittedLSN))
|
|
}
|
|
|
|
return plan, nil
|
|
}
// CancelPlan releases all resources and invalidates the associated session.
|
|
// Used when a plan becomes stale (e.g., address change, epoch bump).
|
|
func (d *RecoveryDriver) CancelPlan(plan *RecoveryPlan, reason string) {
|
|
d.ReleasePlan(plan)
|
|
s := d.Orchestrator.Registry.Sender(plan.ReplicaID)
|
|
if s != nil && s.SessionID() == plan.SessionID {
|
|
s.InvalidateSession(reason, StateDisconnected)
|
|
}
|
|
d.Orchestrator.Log.Record(plan.ReplicaID, plan.SessionID, "plan_cancelled", reason)
|
|
}
// ReleasePlan releases any resources acquired by a plan.
|
|
func (d *RecoveryDriver) ReleasePlan(plan *RecoveryPlan) {
|
|
if plan.RetentionPin != nil {
|
|
d.Storage.ReleaseWALRetention(*plan.RetentionPin)
|
|
plan.RetentionPin = nil
|
|
}
|
|
if plan.SnapshotPin != nil {
|
|
d.Storage.ReleaseSnapshot(*plan.SnapshotPin)
|
|
plan.SnapshotPin = nil
|
|
}
|
|
if plan.FullBasePin != nil {
|
|
d.Storage.ReleaseFullBase(*plan.FullBasePin)
|
|
plan.FullBasePin = nil
|
|
}
|
|
}