
@miguno
Last active November 29, 2017 20:10
WordCount algorithm implemented via a standard Scala application that uses Kafka's Streams API (Kafka 0.10.2)
import java.lang.Long
import java.util.Properties
import java.util.concurrent.TimeUnit
import org.apache.kafka.common.serialization._
import org.apache.kafka.streams._
import org.apache.kafka.streams.kstream.{KStream, KStreamBuilder, KTable}
import scala.collection.JavaConverters.asJavaIterableConverter
// This Scala application is elastic, scalable, distributed (if need be), and fault-tolerant.
// The code below can be used in production to count millions of words per second.
// How it works: http://docs.confluent.io/current/streams/developer-guide.html
// More examples and demo applications: https://github.com/confluentinc/examples
object WordCountApplication {

  def main(args: Array[String]) {
    val streamsConfiguration: Properties = {
      val p = new Properties()
      p.put(StreamsConfig.APPLICATION_ID_CONFIG, "word-count-scala")
      p.put(StreamsConfig.BOOTSTRAP_SERVERS_CONFIG, "kafka-broker1:9092")
      p.put(StreamsConfig.KEY_SERDE_CLASS_CONFIG, Serdes.String.getClass.getName)
      p.put(StreamsConfig.VALUE_SERDE_CLASS_CONFIG, Serdes.String.getClass.getName)
      p
    }

    val stringSerde: Serde[String] = Serdes.String()
    val longSerde: Serde[Long] = Serdes.Long()

    val builder: KStreamBuilder = new KStreamBuilder()
    val textLines: KStream[String, String] = builder.stream("input-topic")
    val wordCounts: KTable[String, Long] = textLines
      .flatMapValues(textLine => textLine.toLowerCase.split("\\W+").toIterable.asJava)
      .groupBy((_, word) => word)
      .count("word-counts")
    wordCounts.to(stringSerde, longSerde, "output-topic")

    val streams: KafkaStreams = new KafkaStreams(builder, streamsConfiguration)
    streams.start()

    Runtime.getRuntime.addShutdownHook(new Thread(() => {
      streams.close(10, TimeUnit.SECONDS)
    }))
  }

}
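
The gist itself ships no build definition. A minimal sbt sketch for compiling the application above could look like this; the version numbers are assumptions, not part of the gist (Kafka Streams 0.10.2.x to match the API used here, and Scala 2.12 so that the lambda passed to the shutdown-hook Thread is accepted as a java.lang.Runnable):

  // build.sbt (sketch; adjust versions to your environment)
  name := "word-count-scala"

  scalaVersion := "2.12.2"

  libraryDependencies += "org.apache.kafka" % "kafka-streams" % "0.10.2.1"

On Scala 2.11 the lambda-to-Runnable (and lambda-to-ValueMapper) conversion does not happen automatically; see the last comment in this thread.
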
@Rtowne-Janrain

Thank you for this gist! 👍 It solved a problem I was having converting the Java example to Scala :)

Awesome

@ardlema

ardlema commented Aug 1, 2017

Hi @miguno, I can't get this to work. I'm running the main method, producing messages (using the kafka-console-producer), and getting nothing when consuming them (using the kafka-console-consumer). If I change the code that counts the words to something simpler, like:

val uppercasedWithMapValues: KStream[String, String] = textLines.mapValues(_.toUpperCase())
uppercasedWithMapValues.to("output-topic")

it works fine. Could the problem be the deserialization of the java.lang.Long values in the output topic by the standard console consumer? Here is how I'm producing and consuming the messages:

./kafka-console-producer.sh --topic input-topic --broker-list localhost:9092
./kafka-console-consumer.sh --topic output-topic --bootstrap-server localhost:9092 --from-beginning

Thank you in advance!
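
A likely explanation for the question above: the application writes its counts to output-topic as java.lang.Long values, so the default console consumer (which assumes string values) does not print them in a readable form, and record caching can additionally delay output until the commit interval elapses. A sketch of a consumer invocation that decodes the counts, using the standard deserializer properties of the console consumer and the broker address from the comment above:

./kafka-console-consumer.sh --topic output-topic --bootstrap-server localhost:9092 --from-beginning \
    --property print.key=true \
    --property key.deserializer=org.apache.kafka.common.serialization.StringDeserializer \
    --property value.deserializer=org.apache.kafka.common.serialization.LongDeserializer
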

@ardlema

ardlema commented Aug 16, 2017

I've solved the previous issue (in my unit tests) by setting cache.max.bytes.buffering to 0. See the following Stack Overflow question
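
For reference, a sketch of that setting applied to the streams configuration in the gist above (the property corresponds to StreamsConfig.CACHE_MAX_BYTES_BUFFERING_CONFIG; a value of 0 disables record caching so every count update is forwarded immediately, which is handy in tests but usually left at the default in production):

  // Disable record caching: forward every KTable update downstream immediately
  // instead of buffering until the cache fills or the commit interval elapses.
  p.put(StreamsConfig.CACHE_MAX_BYTES_BUFFERING_CONFIG, "0")
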

@felipegutierrez

felipegutierrez commented Nov 29, 2017

Hi @ardlema or @miguno,

How did you manage to extract the lines from textLines? I am getting the error below:

[error] /home/felipe/workspace-scala-eclipse/scala-akka-stream-kafka/src/main/scala/com/kafka/streams/WordCountStream.scala:32:78: missing parameter type for expanded function ((x$1) => x$1.toUpperCase())
[error]   val uppercasedWithMapValues: KStream[String, String] = textLines.mapValues(_.toUpperCase())

The error appears with both of the following snippets:

  val uppercasedWithMapValues: KStream[String, String] = textLines.mapValues((x) => x.toUpperCase())
  uppercasedWithMapValues.to("streams-wordcount-output")

or:

  val wordCounts: KTable[String, Long] = textLines
        .flatMapValues(textLine => textLine.toLowerCase.split("\\W+").toIterable.asJava)
        .groupBy((_, word) => word)
        .count("word-counts")

I saw that there is a problem because Kafka is written in Java and we are using Scala.
How did you get your code to work, or did you solve it in another way?
Thanks, Felipe
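
The "missing parameter type for expanded function" error above is the usual symptom of calling Kafka's Java API from Scala 2.11, which does not automatically convert Scala lambdas into Java functional interfaces such as ValueMapper. Two common fixes: build with Scala 2.12, where the lambda syntax used in this gist compiles as-is, or instantiate the interface explicitly. A sketch of the explicit form, assuming the same textLines stream as in the gist:

  import org.apache.kafka.streams.kstream.ValueMapper

  // Explicit ValueMapper instead of the lambda _.toUpperCase(),
  // so the code also compiles on Scala 2.11 (no SAM conversion needed).
  val uppercasedWithMapValues: KStream[String, String] =
    textLines.mapValues(new ValueMapper[String, String] {
      override def apply(line: String): String = line.toUpperCase()
    })
  uppercasedWithMapValues.to("streams-wordcount-output")
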
