|
@ -1,9 +1,9 @@ |
|
|
package sub_coordinator |
|
|
package sub_coordinator |
|
|
|
|
|
|
|
|
import ( |
|
|
import ( |
|
|
|
|
|
"fmt" |
|
|
cmap "github.com/orcaman/concurrent-map/v2" |
|
|
cmap "github.com/orcaman/concurrent-map/v2" |
|
|
"github.com/seaweedfs/seaweedfs/weed/glog" |
|
|
"github.com/seaweedfs/seaweedfs/weed/glog" |
|
|
"github.com/seaweedfs/seaweedfs/weed/mq/pub_balancer" |
|
|
|
|
|
"github.com/seaweedfs/seaweedfs/weed/mq/topic" |
|
|
"github.com/seaweedfs/seaweedfs/weed/mq/topic" |
|
|
"github.com/seaweedfs/seaweedfs/weed/pb/mq_pb" |
|
|
"github.com/seaweedfs/seaweedfs/weed/pb/mq_pb" |
|
|
"time" |
|
|
"time" |
|
@ -13,128 +13,97 @@ type ConsumerGroup struct { |
|
|
topic topic.Topic |
|
|
topic topic.Topic |
|
|
// map a consumer group instance id to a consumer group instance
|
|
|
// map a consumer group instance id to a consumer group instance
|
|
|
ConsumerGroupInstances cmap.ConcurrentMap[string, *ConsumerGroupInstance] |
|
|
ConsumerGroupInstances cmap.ConcurrentMap[string, *ConsumerGroupInstance] |
|
|
mapping *PartitionConsumerMapping |
|
|
|
|
|
|
|
|
Market *Market |
|
|
reBalanceTimer *time.Timer |
|
|
reBalanceTimer *time.Timer |
|
|
pubBalancer *pub_balancer.PubBalancer |
|
|
|
|
|
filerClientAccessor *FilerClientAccessor |
|
|
filerClientAccessor *FilerClientAccessor |
|
|
|
|
|
stopCh chan struct{} |
|
|
} |
|
|
} |
|
|
|
|
|
|
|
|
func NewConsumerGroup(t *mq_pb.Topic, pubBalancer *pub_balancer.PubBalancer, filerClientAccessor *FilerClientAccessor) *ConsumerGroup { |
|
|
|
|
|
return &ConsumerGroup{ |
|
|
|
|
|
|
|
|
func NewConsumerGroup(t *mq_pb.Topic, reblanceSeconds int32, filerClientAccessor *FilerClientAccessor) *ConsumerGroup { |
|
|
|
|
|
cg := &ConsumerGroup{ |
|
|
topic: topic.FromPbTopic(t), |
|
|
topic: topic.FromPbTopic(t), |
|
|
ConsumerGroupInstances: cmap.New[*ConsumerGroupInstance](), |
|
|
ConsumerGroupInstances: cmap.New[*ConsumerGroupInstance](), |
|
|
mapping: NewPartitionConsumerMapping(pub_balancer.MaxPartitionCount), |
|
|
|
|
|
pubBalancer: pubBalancer, |
|
|
|
|
|
filerClientAccessor: filerClientAccessor, |
|
|
filerClientAccessor: filerClientAccessor, |
|
|
} |
|
|
} |
|
|
|
|
|
if conf, err := cg.filerClientAccessor.ReadTopicConfFromFiler(cg.topic); err == nil { |
|
|
|
|
|
var partitions []topic.Partition |
|
|
|
|
|
for _, assignment := range conf.BrokerPartitionAssignments { |
|
|
|
|
|
partitions = append(partitions, topic.FromPbPartition(assignment.Partition)) |
|
|
} |
|
|
} |
|
|
|
|
|
|
|
|
func (cg *ConsumerGroup) OnAddConsumerGroupInstance(consumerGroupInstance string, topic *mq_pb.Topic, maxPartitionCount, rebalanceSeconds int32) { |
|
|
|
|
|
cg.onConsumerGroupInstanceChange(true, "add consumer instance "+consumerGroupInstance, maxPartitionCount, rebalanceSeconds) |
|
|
|
|
|
} |
|
|
|
|
|
func (cg *ConsumerGroup) OnRemoveConsumerGroupInstance(consumerGroupInstance string, topic *mq_pb.Topic, maxPartitionCount, rebalanceSeconds int32) { |
|
|
|
|
|
cg.onConsumerGroupInstanceChange(false, "remove consumer instance "+consumerGroupInstance, maxPartitionCount, rebalanceSeconds) |
|
|
|
|
|
|
|
|
cg.Market = NewMarket(partitions, time.Duration(reblanceSeconds)*time.Second) |
|
|
|
|
|
} else { |
|
|
|
|
|
glog.V(0).Infof("fail to read topic conf from filer: %v", err) |
|
|
|
|
|
return nil |
|
|
} |
|
|
} |
|
|
|
|
|
|
|
|
func (cg *ConsumerGroup) onConsumerGroupInstanceChange(isAdd bool, reason string, maxPartitionCount, rebalanceSeconds int32) { |
|
|
|
|
|
if cg.reBalanceTimer != nil { |
|
|
|
|
|
cg.reBalanceTimer.Stop() |
|
|
|
|
|
cg.reBalanceTimer = nil |
|
|
|
|
|
} |
|
|
|
|
|
if maxPartitionCount == 0 { |
|
|
|
|
|
maxPartitionCount = 1 |
|
|
|
|
|
} |
|
|
|
|
|
if rebalanceSeconds == 0 { |
|
|
|
|
|
rebalanceSeconds = 10 |
|
|
|
|
|
|
|
|
go func() { |
|
|
|
|
|
for { |
|
|
|
|
|
select { |
|
|
|
|
|
case adjustment := <-cg.Market.AdjustmentChan: |
|
|
|
|
|
cgi, found := cg.ConsumerGroupInstances.Get(string(adjustment.consumer)) |
|
|
|
|
|
if !found { |
|
|
|
|
|
glog.V(0).Infof("consumer group instance %s not found", adjustment.consumer) |
|
|
|
|
|
continue |
|
|
} |
|
|
} |
|
|
if isAdd { |
|
|
|
|
|
|
|
|
if adjustment.isAssign { |
|
|
if conf, err := cg.filerClientAccessor.ReadTopicConfFromFiler(cg.topic); err == nil { |
|
|
if conf, err := cg.filerClientAccessor.ReadTopicConfFromFiler(cg.topic); err == nil { |
|
|
var sumMaxPartitionCount int32 |
|
|
|
|
|
for _, cgi := range cg.ConsumerGroupInstances.Items() { |
|
|
|
|
|
sumMaxPartitionCount += cgi.MaxPartitionCount |
|
|
|
|
|
} |
|
|
|
|
|
if sumMaxPartitionCount < int32(len(conf.BrokerPartitionAssignments)) && sumMaxPartitionCount+maxPartitionCount >= int32(len(conf.BrokerPartitionAssignments)) { |
|
|
|
|
|
partitionSlotToBrokerList := pub_balancer.NewPartitionSlotToBrokerList(pub_balancer.MaxPartitionCount) |
|
|
|
|
|
for _, assignment := range conf.BrokerPartitionAssignments { |
|
|
for _, assignment := range conf.BrokerPartitionAssignments { |
|
|
partitionSlotToBrokerList.AddBroker(assignment.Partition, assignment.LeaderBroker, assignment.FollowerBroker) |
|
|
|
|
|
} |
|
|
|
|
|
cg.BalanceConsumerGroupInstances(partitionSlotToBrokerList, reason) |
|
|
|
|
|
return |
|
|
|
|
|
} |
|
|
|
|
|
} |
|
|
|
|
|
|
|
|
if adjustment.partition.Equals(topic.FromPbPartition(assignment.Partition)) { |
|
|
|
|
|
cgi.ResponseChan <- &mq_pb.SubscriberToSubCoordinatorResponse{ |
|
|
|
|
|
Message: &mq_pb.SubscriberToSubCoordinatorResponse_Assignment_{ |
|
|
|
|
|
Assignment: &mq_pb.SubscriberToSubCoordinatorResponse_Assignment{ |
|
|
|
|
|
PartitionAssignment: &mq_pb.BrokerPartitionAssignment{ |
|
|
|
|
|
Partition: adjustment.partition.ToPbPartition(), |
|
|
|
|
|
LeaderBroker: assignment.LeaderBroker, |
|
|
|
|
|
FollowerBroker: assignment.FollowerBroker, |
|
|
|
|
|
}, |
|
|
|
|
|
}, |
|
|
|
|
|
}, |
|
|
} |
|
|
} |
|
|
cg.reBalanceTimer = time.AfterFunc(time.Duration(rebalanceSeconds)*time.Second, func() { |
|
|
|
|
|
cg.BalanceConsumerGroupInstances(nil, reason) |
|
|
|
|
|
cg.reBalanceTimer = nil |
|
|
|
|
|
}) |
|
|
|
|
|
|
|
|
glog.V(0).Infof("send assignment %v to %s", adjustment.partition, adjustment.consumer) |
|
|
|
|
|
break |
|
|
} |
|
|
} |
|
|
func (cg *ConsumerGroup) OnPartitionListChange(assignments []*mq_pb.BrokerPartitionAssignment) { |
|
|
|
|
|
if cg.reBalanceTimer != nil { |
|
|
|
|
|
cg.reBalanceTimer.Stop() |
|
|
|
|
|
cg.reBalanceTimer = nil |
|
|
|
|
|
} |
|
|
} |
|
|
partitionSlotToBrokerList := pub_balancer.NewPartitionSlotToBrokerList(pub_balancer.MaxPartitionCount) |
|
|
|
|
|
for _, assignment := range assignments { |
|
|
|
|
|
partitionSlotToBrokerList.AddBroker(assignment.Partition, assignment.LeaderBroker, assignment.FollowerBroker) |
|
|
|
|
|
} |
|
|
} |
|
|
cg.BalanceConsumerGroupInstances(partitionSlotToBrokerList, "partition list change") |
|
|
|
|
|
|
|
|
} else { |
|
|
|
|
|
cgi.ResponseChan <- &mq_pb.SubscriberToSubCoordinatorResponse{ |
|
|
|
|
|
Message: &mq_pb.SubscriberToSubCoordinatorResponse_UnAssignment_{ |
|
|
|
|
|
UnAssignment: &mq_pb.SubscriberToSubCoordinatorResponse_UnAssignment{ |
|
|
|
|
|
Partition: adjustment.partition.ToPbPartition(), |
|
|
|
|
|
}, |
|
|
|
|
|
}, |
|
|
} |
|
|
} |
|
|
|
|
|
|
|
|
func (cg *ConsumerGroup) BalanceConsumerGroupInstances(knownPartitionSlotToBrokerList *pub_balancer.PartitionSlotToBrokerList, reason string) { |
|
|
|
|
|
glog.V(0).Infof("rebalance consumer group %s due to %s", cg.topic.String(), reason) |
|
|
|
|
|
|
|
|
|
|
|
// collect current topic partitions
|
|
|
|
|
|
partitionSlotToBrokerList := knownPartitionSlotToBrokerList |
|
|
|
|
|
if partitionSlotToBrokerList == nil { |
|
|
|
|
|
if conf, err := cg.filerClientAccessor.ReadTopicConfFromFiler(cg.topic); err == nil { |
|
|
|
|
|
partitionSlotToBrokerList = pub_balancer.NewPartitionSlotToBrokerList(pub_balancer.MaxPartitionCount) |
|
|
|
|
|
for _, assignment := range conf.BrokerPartitionAssignments { |
|
|
|
|
|
partitionSlotToBrokerList.AddBroker(assignment.Partition, assignment.LeaderBroker, assignment.FollowerBroker) |
|
|
|
|
|
|
|
|
glog.V(0).Infof("send unassignment %v to %s", adjustment.partition, adjustment.consumer) |
|
|
} |
|
|
} |
|
|
} else { |
|
|
|
|
|
glog.V(0).Infof("fail to read topic conf from filer: %v", err) |
|
|
|
|
|
|
|
|
case <-cg.stopCh: |
|
|
return |
|
|
return |
|
|
} |
|
|
} |
|
|
} |
|
|
} |
|
|
|
|
|
}() |
|
|
|
|
|
|
|
|
// collect current consumer group instance ids
|
|
|
|
|
|
var consumerInstances []*ConsumerGroupInstance |
|
|
|
|
|
for _, consumerGroupInstance := range cg.ConsumerGroupInstances.Items() { |
|
|
|
|
|
consumerInstances = append(consumerInstances, consumerGroupInstance) |
|
|
|
|
|
} |
|
|
|
|
|
|
|
|
|
|
|
cg.mapping.BalanceToConsumerInstances(partitionSlotToBrokerList, consumerInstances) |
|
|
|
|
|
|
|
|
|
|
|
// convert cg.mapping currentMapping to map of consumer group instance id to partition slots
|
|
|
|
|
|
consumerInstanceToPartitionSlots := make(map[ConsumerGroupInstanceId][]*PartitionSlotToConsumerInstance) |
|
|
|
|
|
for _, partitionSlot := range cg.mapping.currentMapping.PartitionSlots { |
|
|
|
|
|
consumerInstanceToPartitionSlots[partitionSlot.AssignedInstanceId] = append(consumerInstanceToPartitionSlots[partitionSlot.AssignedInstanceId], partitionSlot) |
|
|
|
|
|
|
|
|
return cg |
|
|
} |
|
|
} |
|
|
|
|
|
|
|
|
// notify consumer group instances
|
|
|
|
|
|
for _, consumerGroupInstance := range cg.ConsumerGroupInstances.Items() { |
|
|
|
|
|
partitionSlots, found := consumerInstanceToPartitionSlots[consumerGroupInstance.InstanceId] |
|
|
|
|
|
if !found { |
|
|
|
|
|
partitionSlots = make([]*PartitionSlotToConsumerInstance, 0) |
|
|
|
|
|
} |
|
|
|
|
|
for _, partitionSlot := range partitionSlots { |
|
|
|
|
|
consumerGroupInstance.ResponseChan <- &mq_pb.SubscriberToSubCoordinatorResponse{ |
|
|
|
|
|
Message: &mq_pb.SubscriberToSubCoordinatorResponse_Assignment_{ |
|
|
|
|
|
Assignment: &mq_pb.SubscriberToSubCoordinatorResponse_Assignment{ |
|
|
|
|
|
PartitionAssignment: &mq_pb.BrokerPartitionAssignment{ |
|
|
|
|
|
Partition: &mq_pb.Partition{ |
|
|
|
|
|
RangeStop: partitionSlot.RangeStop, |
|
|
|
|
|
RangeStart: partitionSlot.RangeStart, |
|
|
|
|
|
RingSize: partitionSlotToBrokerList.RingSize, |
|
|
|
|
|
UnixTimeNs: partitionSlot.UnixTimeNs, |
|
|
|
|
|
}, |
|
|
|
|
|
LeaderBroker: partitionSlot.Broker, |
|
|
|
|
|
FollowerBroker: partitionSlot.FollowerBroker, |
|
|
|
|
|
}, |
|
|
|
|
|
}, |
|
|
|
|
|
}, |
|
|
|
|
|
|
|
|
func (cg *ConsumerGroup) AckAssignment(cgi *ConsumerGroupInstance, assignment *mq_pb.SubscriberToSubCoordinatorRequest_AckAssignmentMessage) { |
|
|
|
|
|
fmt.Printf("ack assignment %v\n", assignment) |
|
|
|
|
|
cg.Market.ConfirmAdjustment(&Adjustment{ |
|
|
|
|
|
consumer: cgi.InstanceId, |
|
|
|
|
|
partition: topic.FromPbPartition(assignment.Partition), |
|
|
|
|
|
isAssign: true, |
|
|
|
|
|
}) |
|
|
} |
|
|
} |
|
|
|
|
|
func (cg *ConsumerGroup) AckUnAssignment(cgi *ConsumerGroupInstance, assignment *mq_pb.SubscriberToSubCoordinatorRequest_AckUnAssignmentMessage) { |
|
|
|
|
|
fmt.Printf("ack unassignment %v\n", assignment) |
|
|
|
|
|
cg.Market.ConfirmAdjustment(&Adjustment{ |
|
|
|
|
|
consumer: cgi.InstanceId, |
|
|
|
|
|
partition: topic.FromPbPartition(assignment.Partition), |
|
|
|
|
|
isAssign: false, |
|
|
|
|
|
}) |
|
|
} |
|
|
} |
|
|
|
|
|
|
|
|
|
|
|
func (cg *ConsumerGroup) OnPartitionListChange(assignments []*mq_pb.BrokerPartitionAssignment) { |
|
|
} |
|
|
} |
|
|
|
|
|
|
|
|
|
|
|
func (cg *ConsumerGroup) Shutdown() { |
|
|
|
|
|
close(cg.stopCh) |
|
|
} |
|
|
} |