X-Git-Url: https://juplo.de/gitweb/?a=blobdiff_plain;f=src%2Fmain%2Fjava%2Fde%2Fjuplo%2Fkafka%2Fwordcount%2Fsplitter%2FSplitterStreamProcessor.java;h=12816ab4e27d8a111f24b683afefcb9835981e85;hb=refs%2Ftags%2Fsplitter-1.1.0;hp=7218d6f2e94e44e5338de1d55854a9ed7255eeaa;hpb=3bc3ef7ceb76e7643e1e373293cfdc78f870838a;p=demos%2Fkafka%2Fwordcount diff --git a/src/main/java/de/juplo/kafka/wordcount/splitter/SplitterStreamProcessor.java b/src/main/java/de/juplo/kafka/wordcount/splitter/SplitterStreamProcessor.java index 7218d6f..12816ab 100644 --- a/src/main/java/de/juplo/kafka/wordcount/splitter/SplitterStreamProcessor.java +++ b/src/main/java/de/juplo/kafka/wordcount/splitter/SplitterStreamProcessor.java @@ -6,13 +6,16 @@ import org.apache.kafka.common.serialization.Serdes; import org.apache.kafka.streams.KafkaStreams; import org.apache.kafka.streams.StreamsBuilder; import org.apache.kafka.streams.StreamsConfig; +import org.apache.kafka.streams.kstream.Consumed; import org.apache.kafka.streams.kstream.KStream; +import org.apache.kafka.streams.kstream.Produced; import org.springframework.boot.SpringApplication; import org.springframework.context.ConfigurableApplicationContext; +import org.springframework.kafka.support.serializer.JsonSerde; import org.springframework.stereotype.Component; -import javax.annotation.PostConstruct; -import javax.annotation.PreDestroy; +import jakarta.annotation.PostConstruct; +import jakarta.annotation.PreDestroy; import java.util.Arrays; import java.util.Properties; import java.util.concurrent.CompletableFuture; @@ -36,16 +39,27 @@ public class SplitterStreamProcessor { StreamsBuilder builder = new StreamsBuilder(); - KStream source = builder.stream(properties.getInputTopic()); + JsonSerde recordSerde = + new JsonSerde<>(Recording.class).ignoreTypeHeaders(); + JsonSerde wordSerde = + new JsonSerde<>(Word.class).noTypeInfo(); + + KStream source = builder.stream( + properties.getInputTopic(), + Consumed.with(Serdes.String(), recordSerde)); + source - .flatMapValues(sentence -> Arrays.asList(PATTERN.split(sentence))) - .to(properties.getOutputTopic()); + .flatMapValues(recording -> Arrays + .stream(PATTERN.split(recording.getSentence())) + .map(word -> Word.of(recording.getUser(), word)) + .toList()) + .to(properties.getOutputTopic(), Produced.with(Serdes.String(), wordSerde)); Properties props = new Properties(); props.put(StreamsConfig.APPLICATION_ID_CONFIG, properties.getApplicationId()); props.put(StreamsConfig.BOOTSTRAP_SERVERS_CONFIG, properties.getBootstrapServer()); props.put(StreamsConfig.DEFAULT_KEY_SERDE_CLASS_CONFIG, Serdes.String().getClass().getName()); - props.put(StreamsConfig.DEFAULT_VALUE_SERDE_CLASS_CONFIG, Serdes.String().getClass().getName()); + props.put(StreamsConfig.DEFAULT_VALUE_SERDE_CLASS_CONFIG, JsonSerde.class.getName()); props.put(ConsumerConfig.AUTO_OFFSET_RESET_CONFIG, "earliest"); streams = new KafkaStreams(builder.build(), props);