The main difficulty lies in implementing a KafkaSpout, the component through which Storm receives messages sent from Kafka.
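For context, the snippets below form the core of the spout's emit path and operate on the following per-instance state. This is a minimal sketch: the field names follow the code, but the exact declarations are assumptions inferred from how the fields are used.

// Sketch of the KafkaSpout<K, V> state used below (declarations are assumptions):
private transient KafkaConsumer<K, V> kafkaConsumer;                              // the underlying Kafka consumer
private transient Map<TopicPartition, List<ConsumerRecord<K, V>>> waitingToEmit;  // polled records not yet emitted, per partition
private transient Map<TopicPartition, OffsetManager> offsetManagers;              // acked offsets awaiting commit, per partition
private transient Set<KafkaSpoutMessageId> emitted;                               // emitted but not yet acked/failed message ids
private transient KafkaSpoutRetryService retryService;                            // schedules failed tuples for retry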

// Emit step 1: add the polled records to the waiting-to-emit list

protected void setWaitingToEmit(ConsumerRecords<K, V> consumerRecords) {
    for (TopicPartition tp : consumerRecords.partitions()) {
        waitingToEmit.put(tp, new ArrayList<>(consumerRecords.records(tp)));
    }
}
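setWaitingToEmit is fed from the spout's poll loop. A simplified sketch of how it fits into nextTuple(), assuming a pollTimeoutMs value; the real method also handles commit timers, rebalancing, and partition pause/resume, which are omitted here:

// Simplified nextTuple() flow (commit timers and rebalance handling omitted):
ConsumerRecords<K, V> consumerRecords = kafkaConsumer.poll(pollTimeoutMs);
setWaitingToEmit(consumerRecords);  // step 1: queue everything that was polled
emitIfWaitingNotEmitted();          // step 2: emit at most one tuple downstream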

protected void emitIfWaitingNotEmitted() {
    // Take the pending records from the waitingToEmit map and start emitting
    Iterator<List<ConsumerRecord<K, V>>> waitingToEmitIter = waitingToEmit.values().iterator();
    LOG.info("real event emit begin");
    outerLoop:
    while (waitingToEmitIter.hasNext()) {
        List<ConsumerRecord<K, V>> waitingToEmitForTp = waitingToEmitIter.next();
        while (!waitingToEmitForTp.isEmpty()) {
            final boolean emittedTuple = emitOrRetryTuple(waitingToEmitForTp.remove(0));
            if (emittedTuple) {
                // A tuple was emitted, so stop: the spout emits at most one tuple per call
                break outerLoop;
            }
        }
        // Nothing in this partition's list was emittable; discard the drained entry
        waitingToEmitIter.remove();
    }
}
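The emitOrRetryTuple method below consults retryService to decide whether a record is a first-time emit or a retry of a previously failed tuple. For reference, here is a sketch of configuring the stock exponential-backoff retry service that ships with storm-kafka-client; the interval values are purely illustrative:

// Sketch: stock retry service with exponential backoff (values are illustrative).
// Failed tuples are retried after an initial 500 us delay, backing off to at
// most 10 s between attempts, with no cap on the retry count.
KafkaSpoutRetryService retryService = new KafkaSpoutRetryExponentialBackoff(
    KafkaSpoutRetryExponentialBackoff.TimeInterval.microSeconds(500),
    KafkaSpoutRetryExponentialBackoff.TimeInterval.milliSeconds(2),
    Integer.MAX_VALUE,
    KafkaSpoutRetryExponentialBackoff.TimeInterval.seconds(10));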

// The actual emit process

private boolean emitOrRetryTuple(ConsumerRecord<K, V> record) {
    final TopicPartition tp = new TopicPartition(record.topic(), record.partition());
    final KafkaSpoutMessageId msgId = retryService.getMessageId(record);

    if (offsetManagers.containsKey(tp) && offsetManagers.get(tp).contains(msgId)) { // has been acked
        LOG.trace("Tuple for record [{}] has already been acked. Skipping", record);
    } else if (emitted.contains(msgId)) { // has been emitted and it is pending ack or fail
        LOG.trace("Tuple for record [{}] has already been emitted. Skipping", record);
    } else {
        final OffsetAndMetadata committedOffset = kafkaConsumer.committed(tp);
        if (isAtLeastOnceProcessing()
            && committedOffset != null
            && committedOffset.offset() > record.offset()
            && commitMetadataManager.isOffsetCommittedByThisTopology(tp, committedOffset,
                Collections.unmodifiableMap(offsetManagers))) {
            // Ensures that after a topology with this id is started, the consumer fetch
            // position never falls behind the committed offset (STORM-2844)
            throw new IllegalStateException("Attempting to emit a message that has already been committed."
                + " This should never occur when using the at-least-once processing guarantee.");
        }

        final List<Object> tuple = kafkaSpoutConfig.getTranslator().apply(record);
        if (isEmitTuple(tuple)) {
            final boolean isScheduled = retryService.isScheduled(msgId);
            // not scheduled <=> never failed (i.e. never emitted), or scheduled and ready to be retried
            if (!isScheduled || retryService.isReady(msgId)) {
                final String stream = tuple instanceof KafkaTuple ? ((KafkaTuple) tuple).getStream() : Utils.DEFAULT_STREAM_ID;

                if (!isAtLeastOnceProcessing()) {
                    if (kafkaSpoutConfig.isTupleTrackingEnforced()) {
                        collector.emit(stream, tuple, msgId);
                        LOG.trace("Emitted tuple [{}] for record [{}] with msgId [{}]", tuple, record, msgId);
                    } else {
                        collector.emit(stream, tuple);
                        LOG.trace("Emitted tuple [{}] for record [{}]", tuple, record);
                    }
                } else {
                    emitted.add(msgId);
                    offsetManagers.get(tp).addToEmitMsgs(msgId.offset());
                    if (isScheduled) { // Was scheduled for retry and re-emitted, so remove from schedule.
                        retryService.remove(msgId);
                    }
                    collector.emit(stream, tuple, msgId);
                    tupleListener.onEmit(tuple, msgId);
                    LOG.trace("Emitted tuple [{}] for record [{}] with msgId [{}]", tuple, record, msgId);
                }
                return true;
            }
        } else {
            /* If a null tuple is not configured to be emitted, it should be marked as emitted and acked immediately
             * to allow its offset to be committed to Kafka */
            LOG.debug("Not emitting null tuple for record [{}] as defined in configuration.", record);
            if (isAtLeastOnceProcessing()) {
                msgId.setNullTuple(true);
                offsetManagers.get(tp).addToEmitMsgs(msgId.offset());
                ack(msgId);
            }
        }
    }
    return false;
}
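The tuple emitted above is built by kafkaSpoutConfig.getTranslator().apply(record), and the target stream is taken from KafkaTuple.getStream() when the translator returns a KafkaTuple. Below is a minimal sketch of a custom RecordTranslator; the stream name "values" and the single "value" field are assumptions for illustration.

import java.util.Collections;
import java.util.List;
import org.apache.kafka.clients.consumer.ConsumerRecord;
import org.apache.storm.kafka.spout.KafkaTuple;
import org.apache.storm.kafka.spout.RecordTranslator;
import org.apache.storm.tuple.Fields;

public class ValueOnlyTranslator implements RecordTranslator<String, String> {
    @Override
    public List<Object> apply(ConsumerRecord<String, String> record) {
        // Returning a KafkaTuple lets emitOrRetryTuple route via getStream()
        return new KafkaTuple(record.value()).routedTo("values");
    }

    @Override
    public Fields getFieldsFor(String stream) {
        return new Fields("value");
    }

    @Override
    public List<String> streams() {
        return Collections.singletonList("values");
    }
}

Such a translator is registered on the spout's configuration builder, e.g. KafkaSpoutConfig.builder("localhost:9092", "my-topic").setRecordTranslator(new ValueOnlyTranslator()), where the broker address and topic name are placeholders.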
