@ -113,6 +113,50 @@ var (
getDefaultReplicaPlacement = _getDefaultReplicaPlacement
getDefaultReplicaPlacement = _getDefaultReplicaPlacement
)
)
// ErrorWaitGroup runs a batch of tasks, either inline or on separate
// goroutines, and gathers the errors they return so that Wait can report
// them as one joined error.
//
// The intended sequence is Init, any number of Add calls, then Wait. Wait
// resets the group, so Init has to be called again before the next batch.
type ErrorWaitGroup struct {
	// parallelize selects whether Add starts a goroutine per task (true)
	// or runs the task inline (false).
	parallelize bool
	// wg tracks in-flight task goroutines; nil means no batch is open.
	wg *sync.WaitGroup
	// errors holds the non-nil errors returned by tasks of the current batch.
	errors []error
	// errorsMu guards errors against concurrent appends from task goroutines.
	errorsMu sync.Mutex
}

// ErrorWaitGroupTask is a unit of work that can be submitted to an
// ErrorWaitGroup.
type ErrorWaitGroupTask func() error

// Init opens a new batch by allocating the wait group and clearing any
// previously collected errors. It does nothing if a batch is already open.
func (ewg *ErrorWaitGroup) Init() {
	if ewg.wg != nil {
		return
	}
	ewg.wg = &sync.WaitGroup{}
	ewg.errors = nil
}

// Add submits f to the group. When the group has not been initialized or
// parallelize is false, f runs inline before Add returns; otherwise f runs
// on its own goroutine and is awaited by Wait. A non-nil error returned by
// f is recorded either way.
func (ewg *ErrorWaitGroup) Add(f ErrorWaitGroupTask) {
	if ewg.wg == nil || !ewg.parallelize {
		ewg.record(f())
		return
	}

	ewg.wg.Add(1)
	go func() {
		// Deferred so that Wait cannot block forever if the task ends its
		// goroutine early (for example via runtime.Goexit).
		defer ewg.wg.Done()
		ewg.record(f())
	}()
}

// record stores err for the current batch. Nil errors are dropped instead of
// being stored, since errors.Join would discard them anyway.
func (ewg *ErrorWaitGroup) record(err error) {
	if err == nil {
		return
	}
	ewg.errorsMu.Lock()
	defer ewg.errorsMu.Unlock()
	ewg.errors = append(ewg.errors, err)
}

// Wait blocks until every task started by Add has finished, then returns the
// recorded errors combined with errors.Join (nil when no task failed). The
// group is reset afterwards.
func (ewg *ErrorWaitGroup) Wait() error {
	if ewg.wg != nil {
		ewg.wg.Wait()
	}

	ewg.errorsMu.Lock()
	defer ewg.errorsMu.Unlock()
	err := errors.Join(ewg.errors...)
	ewg.wg = nil
	ewg.errors = nil
	return err
}
func _getDefaultReplicaPlacement ( commandEnv * CommandEnv ) ( * super_block . ReplicaPlacement , error ) {
func _getDefaultReplicaPlacement ( commandEnv * CommandEnv ) ( * super_block . ReplicaPlacement , error ) {
var resp * master_pb . GetMasterConfigurationResponse
var resp * master_pb . GetMasterConfigurationResponse
var err error
var err error
@ -557,48 +601,8 @@ type ecBalancer struct {
ecNodes [ ] * EcNode
ecNodes [ ] * EcNode
replicaPlacement * super_block . ReplicaPlacement
replicaPlacement * super_block . ReplicaPlacement
applyBalancing bool
applyBalancing bool
parallelize bool
wg * sync . WaitGroup
wgErrors [ ] error
}
// ecBalancerTask is the function type accepted by ecBalancer.wgAdd: a unit of work that reports failure through its error result.
type ecBalancerTask func ( ) error
// wgInit lazily allocates the balancer's wait group and clears the collected
// errors; it leaves an already-allocated wait group (and its errors) alone.
func (ecb *ecBalancer) wgInit() {
	if ecb.wg == nil {
		ecb.wg = &sync.WaitGroup{}
		ecb.wgErrors = nil
	}
}
// wgAdd runs f and records its error, if any, in ecb.wgErrors.
// When the wait group is unset or parallelize is false, f runs inline;
// otherwise f runs on a new goroutine tracked by ecb.wg.
func ( ecb * ecBalancer ) wgAdd ( f ecBalancerTask ) {
// Sequential path: run the task before returning.
if ecb . wg == nil || ! ecb . parallelize {
if err := f ( ) ; err != nil {
ecb . wgErrors = append ( ecb . wgErrors , err )
}
return
}
// Parallel path: register the task before starting its goroutine.
ecb . wg . Add ( 1 )
go func ( ) {
if err := f ( ) ; err != nil {
// NOTE(review): this append runs on the task goroutine and no lock is
// visible in this block, so concurrently failing tasks can race on wgErrors.
ecb . wgErrors = append ( ecb . wgErrors , err )
}
ecb . wg . Done ( )
} ( )
}
// wgWait blocks until the tasks tracked by ecb.wg have finished (when a wait
// group is set), then returns the collected errors combined with errors.Join.
func ( ecb * ecBalancer ) wgWait ( ) error {
if ecb . wg != nil {
ecb . wg . Wait ( )
}
err := errors . Join ( ecb . wgErrors ... )
// Reset so that the next wgInit call starts a fresh batch.
ecb . wg = nil
ecb . wgErrors = nil
return err
ewg ErrorWaitGroup
}
}
func ( ecb * ecBalancer ) racks ( ) map [ RackId ] * EcRack {
func ( ecb * ecBalancer ) racks ( ) map [ RackId ] * EcRack {
@ -637,13 +641,13 @@ func (ecb *ecBalancer) balanceEcVolumes(collection string) error {
func ( ecb * ecBalancer ) deleteDuplicatedEcShards ( collection string ) error {
func ( ecb * ecBalancer ) deleteDuplicatedEcShards ( collection string ) error {
vidLocations := ecb . collectVolumeIdToEcNodes ( collection )
vidLocations := ecb . collectVolumeIdToEcNodes ( collection )
ecb . wg Init( )
ecb . ewg . Init ( )
for vid , locations := range vidLocations {
for vid , locations := range vidLocations {
ecb . wg Add( func ( ) error {
ecb . ewg . Add ( func ( ) error {
return ecb . doDeduplicateEcShards ( collection , vid , locations )
return ecb . doDeduplicateEcShards ( collection , vid , locations )
} )
} )
}
}
return ecb . wg Wait( )
return ecb . ewg . Wait ( )
}
}
func ( ecb * ecBalancer ) doDeduplicateEcShards ( collection string , vid needle . VolumeId , locations [ ] * EcNode ) error {
func ( ecb * ecBalancer ) doDeduplicateEcShards ( collection string , vid needle . VolumeId , locations [ ] * EcNode ) error {
@ -684,13 +688,13 @@ func (ecb *ecBalancer) balanceEcShardsAcrossRacks(collection string) error {
vidLocations := ecb . collectVolumeIdToEcNodes ( collection )
vidLocations := ecb . collectVolumeIdToEcNodes ( collection )
// spread the ec shards evenly
// spread the ec shards evenly
ecb . wg Init( )
ecb . ewg . Init ( )
for vid , locations := range vidLocations {
for vid , locations := range vidLocations {
ecb . wg Add( func ( ) error {
ecb . ewg . Add ( func ( ) error {
return ecb . doBalanceEcShardsAcrossRacks ( collection , vid , locations )
return ecb . doBalanceEcShardsAcrossRacks ( collection , vid , locations )
} )
} )
}
}
return ecb . wg Wait( )
return ecb . ewg . Wait ( )
}
}
func countShardsByRack ( vid needle . VolumeId , locations [ ] * EcNode ) map [ string ] int {
func countShardsByRack ( vid needle . VolumeId , locations [ ] * EcNode ) map [ string ] int {
@ -792,7 +796,7 @@ func (ecb *ecBalancer) balanceEcShardsWithinRacks(collection string) error {
racks := ecb . racks ( )
racks := ecb . racks ( )
// spread the ec shards evenly
// spread the ec shards evenly
ecb . wg Init( )
ecb . ewg . Init ( )
for vid , locations := range vidLocations {
for vid , locations := range vidLocations {
// see the volume's shards are in how many racks, and how many in each rack
// see the volume's shards are in how many racks, and how many in each rack
@ -811,12 +815,12 @@ func (ecb *ecBalancer) balanceEcShardsWithinRacks(collection string) error {
}
}
sourceEcNodes := rackEcNodesWithVid [ rackId ]
sourceEcNodes := rackEcNodesWithVid [ rackId ]
averageShardsPerEcNode := ceilDivide ( rackToShardCount [ rackId ] , len ( possibleDestinationEcNodes ) )
averageShardsPerEcNode := ceilDivide ( rackToShardCount [ rackId ] , len ( possibleDestinationEcNodes ) )
ecb . wg Add( func ( ) error {
ecb . ewg . Add ( func ( ) error {
return ecb . doBalanceEcShardsWithinOneRack ( averageShardsPerEcNode , collection , vid , sourceEcNodes , possibleDestinationEcNodes )
return ecb . doBalanceEcShardsWithinOneRack ( averageShardsPerEcNode , collection , vid , sourceEcNodes , possibleDestinationEcNodes )
} )
} )
}
}
}
}
return ecb . wg Wait( )
return ecb . ewg . Wait ( )
}
}
func ( ecb * ecBalancer ) doBalanceEcShardsWithinOneRack ( averageShardsPerEcNode int , collection string , vid needle . VolumeId , existingLocations , possibleDestinationEcNodes [ ] * EcNode ) error {
func ( ecb * ecBalancer ) doBalanceEcShardsWithinOneRack ( averageShardsPerEcNode int , collection string , vid needle . VolumeId , existingLocations , possibleDestinationEcNodes [ ] * EcNode ) error {
@ -847,13 +851,13 @@ func (ecb *ecBalancer) doBalanceEcShardsWithinOneRack(averageShardsPerEcNode int
func ( ecb * ecBalancer ) balanceEcRacks ( ) error {
func ( ecb * ecBalancer ) balanceEcRacks ( ) error {
// balance one rack for all ec shards
// balance one rack for all ec shards
ecb . wg Init( )
ecb . ewg . Init ( )
for _ , ecRack := range ecb . racks ( ) {
for _ , ecRack := range ecb . racks ( ) {
ecb . wg Add( func ( ) error {
ecb . ewg . Add ( func ( ) error {
return ecb . doBalanceEcRack ( ecRack )
return ecb . doBalanceEcRack ( ecRack )
} )
} )
}
}
return ecb . wg Wait( )
return ecb . ewg . Wait ( )
}
}
func ( ecb * ecBalancer ) doBalanceEcRack ( ecRack * EcRack ) error {
func ( ecb * ecBalancer ) doBalanceEcRack ( ecRack * EcRack ) error {
@ -1067,7 +1071,10 @@ func EcBalance(commandEnv *CommandEnv, collections []string, dc string, ecReplic
ecNodes : allEcNodes ,
ecNodes : allEcNodes ,
replicaPlacement : ecReplicaPlacement ,
replicaPlacement : ecReplicaPlacement ,
applyBalancing : applyBalancing ,
applyBalancing : applyBalancing ,
parallelize : parallelize ,
ewg : ErrorWaitGroup {
parallelize : parallelize ,
} ,
}
}
for _ , c := range collections {
for _ , c := range collections {