获取 Kafka 消费延迟(lag)

这个问题看上去很简单,但“得益”于 kafka-python 神奇的文档,真的不算简单,反正我是搜了半天、还看了半天源码才弄明白。思路是:lag = topic 各分区最新 offset 之和 − 该消费组已提交 offset 之和。直接上代码吧。

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
from kafka import SimpleClient, KafkaConsumer
from kafka.common import OffsetRequestPayload, TopicPartition

def get_topic_offset(brokers, topic):
    """Return the sum of the offsets reported for every partition of a topic.

    Args:
        brokers: Broker address(es), passed unchanged to ``SimpleClient``.
        topic: Name of the topic to inspect.

    Returns:
        The sum, over all partitions of ``topic``, of the first offset in
        each offset response.
    """
    client = SimpleClient(brokers)
    try:
        partitions = client.topic_partitions[topic]
        # time=-1 requests the latest offset (Kafka ListOffsets convention);
        # max_offsets=1 asks for a single offset per partition.
        offset_requests = [
            OffsetRequestPayload(topic, p, -1, 1) for p in partitions
        ]
        offsets_responses = client.send_offset_request(offset_requests)
        return sum(r.offsets[0] for r in offsets_responses)
    finally:
        # Always release the broker connections, even if a request fails.
        client.close()


def get_group_offset(brokers, group_id, topic):
    """Return the sum of the offsets a consumer group has committed for a topic.

    Args:
        brokers: Broker address(es), passed as ``bootstrap_servers``.
        group_id: Consumer group whose committed offsets are read.
        topic: Name of the topic to inspect.

    Returns:
        The sum of the ``offset`` field of every committed-offset entry
        returned for the topic's partitions.
    """
    consumer = KafkaConsumer(
        bootstrap_servers=brokers,
        group_id=group_id,
    )
    try:
        pts = [
            TopicPartition(topic=topic, partition=i)
            for i in consumer.partitions_for_topic(topic)
        ]
        # NOTE(review): relies on the private ``_coordinator`` attribute of
        # KafkaConsumer; this may break across kafka-python versions.
        result = consumer._coordinator.fetch_committed_offsets(pts)
        return sum(r.offset for r in result.values())
    finally:
        # Always close the consumer so its connections are not leaked.
        consumer.close()


if __name__ == '__main__':
    # Example run: print the topic's total offset, the group's committed
    # total, and their difference (the lag), one value per line.
    brokers = "localhost:9092"
    topic = "r_liveserverhosts"
    produced = get_topic_offset(brokers, topic)
    consumed = get_group_offset(brokers, "logstash", topic)
    for value in (produced, consumed, produced - consumed):
        print(value)