ConsumerCoordinator分析

来源：互联网发布：windows 10开机扬声器编辑：程序博客网时间：2024/05/29 04:57

ConsumerCoordinator实现了AbstractCoordinator，主要负责和服务器端GroupCoordinator进行交互

一核心字段

// 心跳任务辅助类

Heartbeat heartbeat;

// 当前消费者所属的消费者组的group id

String groupId;

// 负责网络通信

ConsumerNetworkClient client;

Time time;

long retryBackoffMs;

// 进行心跳检测的线程类

HeartbeatThread heartbeatThread = null;

// 是否需要重新发送JoinGroupRequest

boolean rejoinNeeded = true;

// 是否需要执行发送JoinGroupRequest请求前的准备工作

boolean needsJoinPrepare = true;

// 消费者状态，默认是没有加入消费者组的

MemberState state = MemberState.UNJOINED;

// ConsumerNetworkClient发送JoinGroupRequest请求的结果

RequestFuture<ByteBuffer> joinFuture = null;

// GroopCoordinator所在的Node

Node coordinator = null;

// 服务器端GroopCoordinator返回的信息，用于区分两次rebalance操作，由于网络延迟等问题，在执行rebalance时可能收到上次rebalnace

//过程的请求，为了避免着各种干扰，每一次rebalance操作都会递增generation的值

Generation generation = Generation.NO_GENERATION;

// 分配分区策略的列表，消费者在发送JoinGroupRequest的时候包含自身的PartitionAssignor信息，GroupCoordinator

// 从所有消费者都支持的PartitionAssignor选择一个通知leader使用此分配策略进行分区分配，

// 我们可以通过partition.assignment.strategy设置

List<PartitionAssignor> assignors;

// 记录kafka集群的元数据

Metadata metadata;

ConsumerCoordinatorMetrics sensors;

// 一个跟踪消费者的主题列表，分区列表和offsets的类

SubscriptionState subscriptions;

// 提交offset 的回调类

OffsetCommitCallback defaultOffsetCommitCallback;

// 是否开启了自动提交offset的功能

boolean autoCommitEnabled;

// 自动提交的间隔时间

int autoCommitIntervalMs;

ConsumerInterceptors<?, ?> interceptors;

// 是否排除内部的topic列表

boolean excludeInternalTopics;

// 这个集合必须是线程安全的，因为他会被offset提交请求的response handler修改，他会被心跳线程调用

ConcurrentLinkedQueue<OffsetCommitCompletion>completedOffsetCommits;

// 是否是leader

boolean isLeader = false;

Set<String> joinedSubscription;

// 用来记录元数据变化的新快照

MetadataSnapshot metadataSnapshot;

// 用来存储Metadata的快照信息，不过是用来检测Partition分配过程中有没有发生分区数量的变化

MetadataSnapshot assignmentSnapshot;

// 下一次自动提交的最后期限

long nextAutoCommitDeadline;

二核心方法

# 判断对于这个组的coordinatior是否已经准备好接受请求，否则一直阻塞

public synchronized voidensureCoordinatorReady() {
    while (coordinatorUnknown()) {
        RequestFuture<Void>future = lookupCoordinator();
        client.poll(future);
        // 异常处理
        if (future.failed()) {
            if (future.isRetriable())
                // 阻塞更新metadata中的集群元数据
                client.awaitMetadataUpdate();
            else
                throw future.exception();
        } else if (coordinator!= null && client.connectionFailed(coordinator)) {
            // 如果连接不上GroupCoordinator，则退避一段时间，然后重试
            coordinatorDead();
            time.sleep(retryBackoffMs);
        }
    }
}

# 查找GroupCoordinator,并返回一个请求结果

// 查找GroupCoordinator,并返回一个请求结果protected synchronized RequestFuture<Void> lookupCoordinator() {    if (findCoordinatorFuture == null) {        // 查找集群负载最低的Node节点        Node node = this.client.leastLoadedNode();        // 如果找到了，则调用sendGroupCoordinatorRequest        if (node == null) {            return RequestFuture.noBrokersAvailable();        } else            findCoordinatorFuture = sendGroupCoordinatorRequest(node);    }    return findCoordinatorFuture;}

# 检测心跳线程的状态，他必须加入组后定期调用以确保组成员还在

protected synchronized void pollHeartbeat(long now) {    if (heartbeatThread != null) {        // 如果心跳线程失败，将心跳线程设为空，然后抛出异常，下一次调用ensureActiveGroup在创建一个心跳线程        if (heartbeatThread.hasFailed()) {            // set the heartbeat thread to null and raise an exception. If the user catches it,            // the next call to ensureActiveGroup() will spawn a new heartbeat thread.            RuntimeException cause = heartbeatThread.failureCause();            heartbeatThread = null;            throw cause;        }        // 更新一下heartbeat的lastpoll 时间戳        heartbeat.poll(now);    }}

# 确保组可用

public void ensureActiveGroup() {    // 确保coordinator已经准备好接收请求    ensureCoordinatorReady();    // 开启心跳线程    startHeartbeatThreadIfNeeded();    // 加入组    joinGroupIfNeeded();}

# 进行Join Group操作会初始化JoinGroupRequest，并且发送请求到服务器端

void joinGroupIfNeeded() {    // 是否允许重新加入    while (needRejoin() || rejoinIncomplete()) {        // 再次检测coordinator是否已经准备好        ensureCoordinatorReady();        if (needsJoinPrepare) {            // 进行发送JoinGroupRequest之前的准备            onJoinPrepare(generation.generationId, generation.memberId);            //  needsJoinPrepare置为false，表示已经准备好了            needsJoinPrepare = false;        }        // 初始化        RequestFuture<ByteBuffer> future = initiateJoinGroup();        // 阻塞等待join group的完成        client.poll(future);        // 重置JoinGroup的RequestFuture        resetJoinGroupFuture();        // 如果future成功，则重置needsJoinPrepare状态        if (future.succeeded()) {            needsJoinPrepare = true;            onJoinComplete(generation.generationId, generation.memberId, generation.protocol, future.value());        } else {            RuntimeException exception = future.exception();            if (exception instanceof UnknownMemberIdException ||                    exception instanceof RebalanceInProgressException ||                    exception instanceof IllegalGenerationException)                continue;            else if (!future.isRetriable())                throw exception;            time.sleep(retryBackoffMs);        }    }}

# 初始化JoinGroupRequest请求，然后发送该请求

private synchronized RequestFuture<ByteBuffer> initiateJoinGroup() {    // 我们存储join future，以防止我们在开始rebalance之后，就被用户唤醒    // 这确保了我们不会错误地尝试在尚未完成的再平衡完成之前重新加入。    if (joinFuture == null) {        // 对心跳线程进行明确的隔离，这样它就不会干扰到连接组。        // 注意,这个后必须调用onJoinPrepare因为我们必须能够继续发送心跳,如果回调需要一些时间。        disableHeartbeatThread();        // 更改状态        state = MemberState.REBALANCING;        // 发送JoinGroupRequest，返回RequestFuture对象        joinFuture = sendJoinGroupRequest();        // 针对RequestFuture添加监听器        joinFuture.addListener(new RequestFutureListener<ByteBuffer>() {            @Override            public void onSuccess(ByteBuffer value) {                // 如果成功，则更新状态为消费者客户端已成功加入                synchronized (AbstractCoordinator.this) {                    log.info("Successfully joined group {} with generation {}", groupId, generation.generationId);                    state = MemberState.STABLE;                    // 然后开始心跳检测                    if (heartbeatThread != null)                        heartbeatThread.enable();                }            }            @Override            public void onFailure(RuntimeException e) {                synchronized (AbstractCoordinator.this) {                    state = MemberState.UNJOINED;                }            }        });    }    return joinFuture;}

# 发送JoinGroupRequest

private RequestFuture<ByteBuffer> sendJoinGroupRequest() {    // 检测coordinator是否可用    if (coordinatorUnknown())        return RequestFuture.coordinatorNotAvailable();    // 创建JoinGroupRequest    log.info("(Re-)joining group {}", groupId);    JoinGroupRequest request = new JoinGroupRequest(            groupId,            this.sessionTimeoutMs,            this.rebalanceTimeoutMs,            this.generation.memberId,            protocolType(),        metadata());    log.debug("Sending JoinGroup ({}) to coordinator {}", request, this.coordinator);    // 将这个请求放入unsent集合，等待被发送，并返回一个RequestFuture对象    return client.send(coordinator, ApiKeys.JOIN_GROUP, request)            .compose(new JoinGroupResponseHandler());}

# 发送GroupCoordinator请求

private RequestFuture<Void> sendGroupCoordinatorRequest(Node node) {    // 创建GroupCoordinatorRequest请求    log.debug("Sending coordinator request for group {} to broker {}", groupId, node);    GroupCoordinatorRequest metadataRequest = new GroupCoordinatorRequest(this.groupId);    // ConsumerNetworkClient将创建的GroupCoordinatorRequest请求放入一个unsent列表，等待发送    // 并返回RequestFuture对象，返回的RequestFuture对象经过compose的适配    return client.send(node, ApiKeys.GROUP_COORDINATOR, metadataRequest)                 .compose(new GroupCoordinatorResponseHandler());}

# 发送离开组的请求

public synchronized void maybeLeaveGroup() {    if (!coordinatorUnknown() && state != MemberState.UNJOINED && generation != Generation.NO_GENERATION) {        // this is a minimal effort attempt to leave the group. we do not        // attempt any resending if the request fails or times out.        LeaveGroupRequest request = new LeaveGroupRequest(groupId, generation.memberId);        client.send(coordinator, ApiKeys.LEAVE_GROUP, request)                .compose(new LeaveGroupResponseHandler());        client.pollNoWakeup();    }    resetGeneration();}

# 给Metadata添加监听器

private void addMetadataListener() {    this.metadata.addListener(new Metadata.Listener() {        @Override        public void onMetadataUpdate(Cluster cluster) {            // if we encounter any unauthorized topics, raise an exception to the user            if (!cluster.unauthorizedTopics().isEmpty())                throw new TopicAuthorizationException(new HashSet<>(cluster.unauthorizedTopics()));            if (subscriptions.hasPatternSubscription())                updatePatternSubscription(cluster);            // check if there are any changes to the metadata which should trigger a rebalance            if (subscriptions.partitionsAutoAssigned()) {                MetadataSnapshot snapshot = new MetadataSnapshot(subscriptions, cluster);                if (!snapshot.equals(metadataSnapshot))                    metadataSnapshot = snapshot;            }        }    });}

# 查找指定的分区分配策略

// 查找指定的分区分配策略private PartitionAssignor lookupAssignor(String name) {    for (PartitionAssignor assignor : this.assignors) {        if (assignor.name().equals(name))            return assignor;    }    return null;}

# JoinGroupRequest请求完成之后，需要执行的动作

protected void onJoinComplete(int generation, String memberId,        String assignmentStrategy, ByteBuffer assignmentBuffer) {    // 只有leader才会监控元数据的改变    if (!isLeader)        assignmentSnapshot = null;    // 获取partition分配策略    PartitionAssignor assignor = lookupAssignor(assignmentStrategy);    if (assignor == null)        throw new IllegalStateException("Coordinator selected invalid assignment protocol: " + assignmentStrategy);    // 获取分配结果    Assignment assignment = ConsumerProtocol.deserializeAssignment(assignmentBuffer);    // 设置标记刷新最近一次提交的offset    subscriptions.needRefreshCommits();    // 更新分区的分配    subscriptions.assignFromSubscribed(assignment.partitions());    // 给一个分区分配策略一个机会更新分配结果    assignor.onAssignment(assignment);    // reschedule the auto commit starting from now    this.nextAutoCommitDeadline = time.milliseconds() + autoCommitIntervalMs;    // 执行rebalance之后的回调    ConsumerRebalanceListener listener = subscriptions.listener();    log.info("Setting newly assigned partitions {} for group {}", subscriptions.assignedPartitions(), groupId);    try {        Set<TopicPartition> assigned = new HashSet<>(subscriptions.assignedPartitions());        listener.onPartitionsAssigned(assigned);    } catch (WakeupException e) {        throw e;    } catch (Exception e) {        log.error("User provided listener {} for group {} failed on partition assignment",                listener.getClass().getName(), groupId, e);    }}

# 对协调器事件的轮询。这确保了协调器是已知的，并且是消费者加入了这个群组(如果它使用的是组管理)。这也可以处理周期性的offset提交，如果启用了它们。

public void poll(long now) {    // 调用offset 提交请求的回调函数，如果有    invokeCompletedOffsetCommitCallbacks();    // 判断订阅状态是否自动分配分区且coordinator不为空    if (subscriptions.partitionsAutoAssigned() && coordinatorUnknown()) {        // 确保coordinator已经准备好接收请求了        ensureCoordinatorReady();        now = time.milliseconds();    }    // 判断是否需要重新join    if (needRejoin()) {        // 由于初始元数据获取和初始重新平衡之间的竞争条件，我们需要确保元数据在开始加入之前是新鲜的。        // 确保了我们在join之前至少有一次与集群的主题的模式匹配        if (subscriptions.hasPatternSubscription())            // 刷新元数据            client.ensureFreshMetadata();        // 确保协调器可用，心跳线程开启和组可用        ensureActiveGroup();        now = time.milliseconds();    }    // 检测心跳线程的状态    pollHeartbeat(now);    // 异步的自动提交offset    maybeAutoCommitOffsetsAsync(now);}

# 为消费者组进行分配，主要用于leader向组内所有consumer推送状态

protected Map<String, ByteBuffer> performAssignment(String leaderId,        String assignmentStrategy, Map<String, ByteBuffer> allSubscriptions) {    // 根据partition分配策略    PartitionAssignor assignor = lookupAssignor(assignmentStrategy);    if (assignor == null)        throw new IllegalStateException("Coordinator selected invalid assignment protocol: " + assignmentStrategy);    Set<String> allSubscribedTopics = new HashSet<>();    Map<String, Subscription> subscriptions = new HashMap<>();    for (Map.Entry<String, ByteBuffer> subscriptionEntry : allSubscriptions.entrySet()) {        Subscription subscription = ConsumerProtocol.deserializeSubscription(subscriptionEntry.getValue());        subscriptions.put(subscriptionEntry.getKey(), subscription);        allSubscribedTopics.addAll(subscription.topics());    }    // the leader will begin watching for changes to any of the topics the group is interested in,    // which ensures that all metadata changes will eventually be seen    this.subscriptions.groupSubscribe(allSubscribedTopics);    metadata.setTopics(this.subscriptions.groupSubscription());    // update metadata (if needed) and keep track of the metadata used for assignment so that    // we can check after rebalance completion whether anything has changed    client.ensureFreshMetadata();    isLeader = true;    assignmentSnapshot = metadataSnapshot;    log.debug("Performing assignment for group {} using strategy {} with subscriptions {}",            groupId, assignor.name(), subscriptions);    Map<String, Assignment> assignment = assignor.assign(metadata.fetch(), subscriptions);    log.debug("Finished assignment for group {}: {}", groupId, assignment);    Map<String, ByteBuffer> groupAssignment = new HashMap<>();    for (Map.Entry<String, Assignment> assignmentEntry : assignment.entrySet()) {        ByteBuffer buffer = ConsumerProtocol.serializeAssignment(assignmentEntry.getValue());        groupAssignment.put(assignmentEntry.getKey(), buffer);    }    return groupAssignment;}

# 判断是否需要进行重新join

public boolean needRejoin() {    // 如果不是自动分配partition,不如用户自己指定，则不需要rejoin    if (!subscriptions.partitionsAutoAssigned())        return false;    // 如果我们执行了任务并且元数据改变了，我们需要重新加入    if (assignmentSnapshot != null && !assignmentSnapshot.equals(metadataSnapshot))        return true;    // 如果我们的订阅自上一次join之后改变了，那么我们需要加入    if (joinedSubscription != null && !joinedSubscription.equals(subscriptions.subscription()))        return true;    // 默认需要重新join    return super.needRejoin();}

# 对于一套partition,从协调器中获取当前已提交的偏移量

public void refreshCommittedOffsetsIfNeeded() {    if (subscriptions.refreshCommitsNeeded()) {        // 对于分配的partition,从协调器中获取当前已提交的偏移量        Map<TopicPartition, OffsetAndMetadata> offsets = fetchCommittedOffsets(subscriptions.assignedPartitions());        // 遍历TopicPartition        for (Map.Entry<TopicPartition, OffsetAndMetadata> entry : offsets.entrySet()) {            TopicPartition tp = entry.getKey();            // 验证分配是否是有效的,如果有效，提交offset            if (subscriptions.isAssigned(tp))                this.subscriptions.committed(tp, entry.getValue());        }        // 刷新提交        this.subscriptions.commitsRefreshed();    }}

# 进行发送JoinGroupRequest之前的准备

protected void onJoinPrepare(int generation, String memberId) {    // 如果开启了自动提交，则在rebalance之前进行自动提交offset    maybeAutoCommitOffsetsSync();    // 执行注册在SubscriptionState上的ConsumerRebalanceListener的回调方法    ConsumerRebalanceListener listener = subscriptions.listener();    log.info("Revoking previously assigned partitions {} for group {}", subscriptions.assignedPartitions(), groupId);    try {        Set<TopicPartition> revoked = new HashSet<>(subscriptions.assignedPartitions());        listener.onPartitionsRevoked(revoked);    } catch (WakeupException e) {        throw e;    } catch (Exception e) {        log.error("User provided listener {} for group {} failed on partition revocation",                listener.getClass().getName(), groupId, e);    }    isLeader = false;    // 重置该组的订阅，只包含该用户订阅的主题。    subscriptions.resetGroupSubscription();}

阅读全文

0 0