11 changes: 11 additions & 0 deletions kafka-streams-samples/kafka-streams-word-count/pom.xml
@@ -17,6 +17,11 @@
<relativePath>../..</relativePath>
</parent>

<properties>
<!-- This should be kept in sync with spring-kafka-test kafka version -->
<kafka.version>2.0.1</kafka.version>
</properties>

<dependencies>
<dependency>
<groupId>org.springframework.cloud</groupId>
@@ -36,6 +41,12 @@
<artifactId>spring-kafka-test</artifactId>
<scope>test</scope>
</dependency>
<dependency>
<groupId>org.apache.kafka</groupId>
<artifactId>kafka-streams-test-utils</artifactId>
<version>${kafka.version}</version>
<scope>test</scope>
</dependency>
</dependencies>

<build>
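The kafka-streams-test-utils dependency added above provides TopologyTestDriver, which executes a Kafka Streams topology in-process, with no embedded broker. For orientation, a minimal sketch of that test style, assuming a trivial pass-through topology and illustrative topic names (neither is part of this PR):

import java.util.Properties;
import org.apache.kafka.clients.producer.ProducerRecord;
import org.apache.kafka.common.serialization.Serdes;
import org.apache.kafka.common.serialization.StringDeserializer;
import org.apache.kafka.common.serialization.StringSerializer;
import org.apache.kafka.streams.StreamsBuilder;
import org.apache.kafka.streams.StreamsConfig;
import org.apache.kafka.streams.TopologyTestDriver;
import org.apache.kafka.streams.kstream.Consumed;
import org.apache.kafka.streams.kstream.Produced;
import org.apache.kafka.streams.test.ConsumerRecordFactory;

public class PassThroughSketch {
    public static void main(String[] args) {
        // Hypothetical topology: copy every record from "in" to "out".
        StreamsBuilder builder = new StreamsBuilder();
        builder.stream("in", Consumed.with(Serdes.String(), Serdes.String()))
                .to("out", Produced.with(Serdes.String(), Serdes.String()));

        // Mandatory settings; the bootstrap server is never actually contacted.
        Properties props = new Properties();
        props.put(StreamsConfig.APPLICATION_ID_CONFIG, "pass-through-sketch");
        props.put(StreamsConfig.BOOTSTRAP_SERVERS_CONFIG, "localhost:9092");

        TopologyTestDriver driver = new TopologyTestDriver(builder.build(), props);
        ConsumerRecordFactory<String, String> factory =
                new ConsumerRecordFactory<>(new StringSerializer(), new StringSerializer());

        driver.pipeInput(factory.create("in", "key", "value"));
        ProducerRecord<String, String> output =
                driver.readOutput("out", new StringDeserializer(), new StringDeserializer());
        System.out.println(output.key() + " -> " + output.value()); // key -> value

        driver.close();
    }
}

The real test added at the bottom of this diff follows the same pipeInput/readOutput pattern, but wires in the actual word-count topology.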
kafka-streams-samples/kafka-streams-word-count/src/main/java/kafka/streams/word/count/KafkaStreamsWordCountApplication.java
@@ -17,6 +17,7 @@
package kafka.streams.word.count;

import org.apache.kafka.common.serialization.Serdes;
import org.apache.kafka.common.utils.Bytes;
import org.apache.kafka.streams.KeyValue;
import org.apache.kafka.streams.kstream.KStream;
import org.apache.kafka.streams.kstream.Materialized;
@@ -42,15 +43,19 @@ public static void main(String[] args) {
@EnableBinding(KafkaStreamsProcessor.class)
public static class WordCountProcessorApplication {

@StreamListener("input")
@SendTo("output")
public KStream<?, WordCount> process(KStream<Object, String> input) {
public static final String INPUT_TOPIC = "input";
public static final String OUTPUT_TOPIC = "output";
public static final int WINDOW_SIZE_MS = 30000;

@StreamListener(INPUT_TOPIC)
@SendTo(OUTPUT_TOPIC)
public KStream<Bytes, WordCount> process(KStream<Bytes, String> input) {

return input
.flatMapValues(value -> Arrays.asList(value.toLowerCase().split("\\W+")))
.map((key, value) -> new KeyValue<>(value, value))
.groupByKey(Serialized.with(Serdes.String(), Serdes.String()))
.windowedBy(TimeWindows.of(30000))
.windowedBy(TimeWindows.of(WINDOW_SIZE_MS))
.count(Materialized.as("WordCounts-1"))
.toStream()
.map((key, value) -> new KeyValue<>(null, new WordCount(key.key(), value, new Date(key.window().start()), new Date(key.window().end()))));
@@ -67,6 +72,19 @@ static class WordCount {

private Date end;

@Override
public String toString() {
final StringBuffer sb = new StringBuffer("WordCount{");
sb.append("word='").append(word).append('\'');
sb.append(", count=").append(count);
sb.append(", start=").append(start);
sb.append(", end=").append(end);
sb.append('}');
return sb.toString();
}

WordCount() {}

WordCount(String word, long count, Date start, Date end) {
this.word = word;
this.count = count;
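One detail worth spelling out (an illustration of Kafka Streams semantics, not code from this PR): TimeWindows.of(WINDOW_SIZE_MS) creates tumbling windows aligned to the epoch, so a record with timestamp t lands in the window starting at t - (t % WINDOW_SIZE_MS). This is exactly what the test below asserts with new Date(0) and new Date(WINDOW_SIZE_MS):

public class WindowBoundsSketch {
    public static void main(String[] args) {
        long windowSizeMs = 30_000L; // WINDOW_SIZE_MS in the sample
        long timestamp = 1L;         // the timestamp piped in by testOneWord
        long windowStart = timestamp - (timestamp % windowSizeMs);
        long windowEnd = windowStart + windowSizeMs;
        System.out.println("[" + windowStart + ", " + windowEnd + ")"); // prints [0, 30000)
    }
}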
@@ -0,0 +1,12 @@
<?xml version="1.0" encoding="UTF-8"?>
<configuration>
<appender name="stdout" class="ch.qos.logback.core.ConsoleAppender">
<encoder>
<pattern>%d{ISO8601} %5p %t %c{2}:%L - %m%n</pattern>
</encoder>
</appender>
<root level="INFO">
<appender-ref ref="stdout"/>
</root>
<logger name="org.apache.kafka.streams.processor.internals" level="WARN"/>
</configuration>
kafka-streams-samples/kafka-streams-word-count/src/test/java/kafka/streams/word/count/WordCountProcessorApplicationTests.java
@@ -0,0 +1,163 @@
/*
* Copyright 2019 the original author or authors.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* https://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/

package kafka.streams.word.count;

import org.apache.kafka.clients.producer.ProducerRecord;
import org.apache.kafka.common.serialization.*;
import org.apache.kafka.common.utils.Bytes;
import org.apache.kafka.streams.KeyValue;
import org.apache.kafka.streams.StreamsBuilder;
import org.apache.kafka.streams.StreamsConfig;
import org.apache.kafka.streams.TopologyTestDriver;
import org.apache.kafka.streams.kstream.Consumed;
import org.apache.kafka.streams.kstream.KStream;
import org.apache.kafka.streams.kstream.Produced;
import org.apache.kafka.streams.test.ConsumerRecordFactory;
import org.apache.kafka.streams.test.OutputVerifier;
import org.junit.After;
import org.junit.Before;
import org.junit.Test;
import org.springframework.kafka.support.serializer.JsonDeserializer;
import org.springframework.kafka.support.serializer.JsonSerde;

import java.util.*;
import java.util.stream.Collectors;

import static org.assertj.core.api.Assertions.assertThat;

/**
* TopologyTestDriver-based test of the stream processing in {@link KafkaStreamsWordCountApplication}.
*
* @author Jukka Karvanen / jukinimi.com
*/
public class WordCountProcessorApplicationTests {
private TopologyTestDriver testDriver;
public static final String INPUT_TOPIC = KafkaStreamsWordCountApplication.WordCountProcessorApplication.INPUT_TOPIC;
public static final String OUTPUT_TOPIC = KafkaStreamsWordCountApplication.WordCountProcessorApplication.OUTPUT_TOPIC;

final Serde<String> stringSerde = Serdes.String();
final JsonSerde<KafkaStreamsWordCountApplication.WordCount> countSerde = new JsonSerde<>(KafkaStreamsWordCountApplication.WordCount.class);
final Serde<Bytes> nullSerde = Serdes.Bytes(); // Serde for the unused key
private ConsumerRecordFactory<String, String> recordFactory = new ConsumerRecordFactory<>(
stringSerde.serializer(), stringSerde.serializer()); // The key is fed in as a String, even though it is read back as Bytes

static Properties getStreamsConfiguration() {
final Properties streamsConfiguration = new Properties();
// These must be set even though they do not matter with TopologyTestDriver
streamsConfiguration.put(StreamsConfig.APPLICATION_ID_CONFIG, "TopologyTestDriver");
streamsConfiguration.put(StreamsConfig.BOOTSTRAP_SERVERS_CONFIG, "localhost:9092");
return streamsConfiguration;
}

/**
* Set up the stream topology:
* add the KStream based on the @StreamListener annotation,
* and the to(topic) call based on the @SendTo annotation.
*/
@Before
public void setup() {
final StreamsBuilder builder = new StreamsBuilder();
KStream<Bytes, String> input = builder.stream(INPUT_TOPIC, Consumed.with(nullSerde, stringSerde));
KafkaStreamsWordCountApplication.WordCountProcessorApplication app = new KafkaStreamsWordCountApplication.WordCountProcessorApplication();
KStream<Bytes, KafkaStreamsWordCountApplication.WordCount> output = app.process(input);
output.to(OUTPUT_TOPIC, Produced.with(nullSerde, countSerde));
testDriver = new TopologyTestDriver(builder.build(), getStreamsConfiguration());
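// TopologyTestDriver runs the topology synchronously and in-process; no broker or ZooKeeper is started.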
}

@After
public void tearDown() {
try {
testDriver.close();
} catch (final RuntimeException e) {
// https://issues.apache.org/jira/browse/KAFKA-6647 causes an exception on Windows; ignore it.
// The logged stack trace cannot be avoided.
System.out.println("Ignoring exception; the test fails on Windows due to this exception: " + e.getLocalizedMessage());
}
}

/**
* Read one record from the output topic.
*
* @return a ProducerRecord containing a WordCount as its value
*/
private ProducerRecord<Bytes, KafkaStreamsWordCountApplication.WordCount> readOutput() {
return testDriver.readOutput(OUTPUT_TOPIC, nullSerde.deserializer(), countSerde.deserializer());
}

/**
* Read the counts from the output topic into a map, ignoring start and end dates.
* If an existing word's count is incremented, the word can appear twice in the output; later values replace earlier ones in the map.
*
* @return map of word to count
*/
private Map<String, Long> getOutputMap() {
final Map<String, Long> output = new HashMap<>();
ProducerRecord<Bytes, KafkaStreamsWordCountApplication.WordCount> outputRow;
while ((outputRow = readOutput()) != null) {
output.put(outputRow.value().getWord(), outputRow.value().getCount());
}
return output;
}

/**
* Simple test validating the count of a single word.
*/
@Test
public void testOneWord() {
final String nullKey = null;
// Feed the word "Hello" into the input topic with a null Kafka key; the timestamp is irrelevant in this case
testDriver.pipeInput(recordFactory.create(INPUT_TOPIC, nullKey, "Hello", 1L));
// Read and validate the output
final ProducerRecord<Bytes, KafkaStreamsWordCountApplication.WordCount> output = readOutput();
assertThat(output).isNotNull();
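// With timestamp 1 and epoch-aligned 30-second tumbling windows, the record falls into the window [0, WINDOW_SIZE_MS).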
assertThat(output.value()).isEqualToComparingFieldByField(new KafkaStreamsWordCountApplication.WordCount("hello", 1L, new Date(0), new Date(KafkaStreamsWordCountApplication.WordCountProcessorApplication.WINDOW_SIZE_MS)));
// No more output in the topic
assertThat(readOutput()).isNull();
}

/**
* Test word counts over a list of sentences.
*/
@Test
public void shouldCountWords() {
final List<String> inputLines = Arrays.asList(
"Kafka Streams Examples",
"Spring Cloud Stream Sample",
"Using Kafka Streams Test Utils"
);
final List<KeyValue<String, String>> inputRecords = inputLines.stream().map(v -> new KeyValue<String, String>(null, v)).collect(Collectors.toList());

final Map<String, Long> expectedWordCounts = new HashMap<>();
expectedWordCounts.put("spring", 1L);
expectedWordCounts.put("cloud", 1L);
expectedWordCounts.put("examples", 1L);
expectedWordCounts.put("sample", 1L);
expectedWordCounts.put("streams", 2L);
expectedWordCounts.put("stream", 1L);
expectedWordCounts.put("test", 1L);
expectedWordCounts.put("utils", 1L);
expectedWordCounts.put("kafka", 2L);
expectedWordCounts.put("using", 1L);

testDriver.pipeInput(recordFactory.create(INPUT_TOPIC, inputRecords, 1L, 1000L)); // All records are fed into the same 30-second time window
final Map<String, Long> actualWordCounts = getOutputMap();
assertThat(actualWordCounts).containsAllEntriesOf(expectedWordCounts).hasSameSizeAs(expectedWordCounts);
}
}
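A closing note on the timestamps (my illustration, not code from this PR): the create(INPUT_TOPIC, inputRecords, 1L, 1000L) overload stamps the records starting at timestamp 1 and advancing by 1000 ms per record, so the three sentences get timestamps 1, 1001, and 2001, all landing in the first 30-second window, as the comment in shouldCountWords notes:

public class TimestampSketch {
    public static void main(String[] args) {
        long start = 1L;      // startTimestamp passed to recordFactory.create(...)
        long advance = 1000L; // advanceMs passed to recordFactory.create(...)
        for (int i = 0; i < 3; i++) {
            long ts = start + i * advance;
            // Integer division by the window size gives the tumbling-window index: always 0 here.
            System.out.println("record " + i + ": ts=" + ts + ", window=" + (ts / 30_000L));
        }
    }
}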