X-Git-Url: http://juplo.de/gitweb/?a=blobdiff_plain;f=src%2Fmain%2Fjava%2Fde%2Fjuplo%2Fkafka%2FEndlessConsumer.java;h=c79b1e0c7ad9466bd7e5f514eeb01a8841153176;hb=7d46d2df2b323e0f4df2e7b5f15706840de4b804;hp=18cef23c16b96c723559f8bd79f6ad2106a41e16;hpb=014de600554a5f9ba620fdadb8581b5882bc4d20;p=demos%2Fkafka%2Ftraining diff --git a/src/main/java/de/juplo/kafka/EndlessConsumer.java b/src/main/java/de/juplo/kafka/EndlessConsumer.java index 18cef23..c79b1e0 100644 --- a/src/main/java/de/juplo/kafka/EndlessConsumer.java +++ b/src/main/java/de/juplo/kafka/EndlessConsumer.java @@ -1,16 +1,17 @@ package de.juplo.kafka; import lombok.extern.slf4j.Slf4j; +import org.apache.kafka.clients.consumer.ConsumerRebalanceListener; import org.apache.kafka.clients.consumer.ConsumerRecord; import org.apache.kafka.clients.consumer.ConsumerRecords; import org.apache.kafka.clients.consumer.KafkaConsumer; +import org.apache.kafka.common.TopicPartition; import org.apache.kafka.common.errors.WakeupException; import org.apache.kafka.common.serialization.StringDeserializer; import javax.annotation.PreDestroy; import java.time.Duration; -import java.util.Arrays; -import java.util.Properties; +import java.util.*; import java.util.concurrent.ExecutionException; import java.util.concurrent.ExecutorService; import java.util.concurrent.locks.Condition; @@ -22,6 +23,7 @@ import java.util.concurrent.locks.ReentrantLock; public class EndlessConsumer implements Runnable { private final ExecutorService executor; + private final PartitionStatisticsRepository repository; private final String bootstrapServer; private final String groupId; private final String id; @@ -31,12 +33,17 @@ public class EndlessConsumer implements Runnable private final Lock lock = new ReentrantLock(); private final Condition condition = lock.newCondition(); private boolean running = false; + private Exception exception; private long consumed = 0; private KafkaConsumer consumer = null; + private final Map> seen = new HashMap<>(); + + public EndlessConsumer( ExecutorService executor, + PartitionStatisticsRepository repository, String bootstrapServer, String groupId, String clientId, @@ -44,6 +51,7 @@ public class EndlessConsumer implements Runnable String autoOffsetReset) { this.executor = executor; + this.repository = repository; this.bootstrapServer = bootstrapServer; this.groupId = groupId; this.id = clientId; @@ -60,14 +68,52 @@ public class EndlessConsumer implements Runnable props.put("bootstrap.servers", bootstrapServer); props.put("group.id", groupId); props.put("client.id", id); + props.put("enable.auto.commit", false); props.put("auto.offset.reset", autoOffsetReset); + props.put("metadata.max.age.ms", "1000"); props.put("key.deserializer", StringDeserializer.class.getName()); props.put("value.deserializer", StringDeserializer.class.getName()); this.consumer = new KafkaConsumer<>(props); log.info("{} - Subscribing to topic {}", id, topic); - consumer.subscribe(Arrays.asList(topic)); + consumer.subscribe(Arrays.asList(topic), new ConsumerRebalanceListener() + { + @Override + public void onPartitionsRevoked(Collection partitions) + { + partitions.forEach(tp -> + { + log.info("{} - removing partition: {}", id, tp); + Map removed = seen.remove(tp.partition()); + for (String key : removed.keySet()) + { + log.info( + "{} - Seen {} messages for partition={}|key={}", + id, + removed.get(key), + tp.partition(), + key); + } + repository.save(new StatisticsDocument(tp.partition(), removed, consumer.position(tp))); + }); + } + + @Override + public void onPartitionsAssigned(Collection partitions) + { + partitions.forEach(tp -> + { + log.info("{} - adding partition: {}", id, tp); + StatisticsDocument document = + repository + .findById(Integer.toString(tp.partition())) + .orElse(new StatisticsDocument(tp.partition())); + consumer.seek(tp, document.offset); + seen.put(tp.partition(), document.statistics); + }); + } + }); while (true) { @@ -88,7 +134,24 @@ public class EndlessConsumer implements Runnable record.key(), record.value() ); + + Integer partition = record.partition(); + String key = record.key() == null ? "NULL" : record.key(); + Map byKey = seen.get(partition); + + if (!byKey.containsKey(key)) + byKey.put(key, 0); + + int seenByKey = byKey.get(key); + seenByKey++; + byKey.put(key, seenByKey); } + + seen.forEach((partiton, statistics) -> repository.save( + new StatisticsDocument( + partiton, + statistics, + consumer.position(new TopicPartition(topic, partiton))))); } } catch(WakeupException e) @@ -99,7 +162,7 @@ public class EndlessConsumer implements Runnable catch(Exception e) { log.error("{} - Unexpected error: {}", id, e.toString(), e); - shutdown(); + shutdown(e); } finally { @@ -110,11 +173,17 @@ public class EndlessConsumer implements Runnable } private void shutdown() + { + shutdown(null); + } + + private void shutdown(Exception e) { lock.lock(); try { running = false; + exception = e; condition.signal(); } finally @@ -123,6 +192,11 @@ public class EndlessConsumer implements Runnable } } + public Map> getSeen() + { + return seen; + } + public void start() { lock.lock(); @@ -133,6 +207,7 @@ public class EndlessConsumer implements Runnable log.info("{} - Starting - consumed {} messages before", id, consumed); running = true; + exception = null; executor.submit(this); } finally @@ -181,4 +256,33 @@ public class EndlessConsumer implements Runnable log.info("{}: Consumed {} messages in total, exiting!", id, consumed); } } + + public boolean running() + { + lock.lock(); + try + { + return running; + } + finally + { + lock.unlock(); + } + } + + public Optional exitStatus() + { + lock.lock(); + try + { + if (running) + throw new IllegalStateException("No exit-status available: Consumer instance " + id + " is running!"); + + return Optional.ofNullable(exception); + } + finally + { + lock.unlock(); + } + } }