diff --git a/examples/src/main/java/org/apache/spark/examples/sql/streaming/JavaStructuredNetworkWordCount.java b/examples/src/main/java/org/apache/spark/examples/sql/streaming/JavaStructuredNetworkWordCount.java index 99b7029b774d5..5a75189a8513e 100644 --- a/examples/src/main/java/org/apache/spark/examples/sql/streaming/JavaStructuredNetworkWordCount.java +++ b/examples/src/main/java/org/apache/spark/examples/sql/streaming/JavaStructuredNetworkWordCount.java @@ -19,8 +19,6 @@ import org.apache.spark.sql.*; import org.apache.spark.sql.streaming.StreamingQuery; -import java.util.regex.Pattern; - /** * Counts words in UTF8 encoded, '\n' delimited text received from the network every second. * @@ -34,7 +32,6 @@ * localhost 9999 ` */ public final class JavaStructuredNetworkWordCount { - private static final Pattern SPACE = Pattern.compile(" "); public static void main(String[] args) throws Exception { if (args.length < 3) { @@ -60,11 +57,11 @@ public static void main(String[] args) throws Exception { .load(); // Split the lines into words - Dataset words = lines.select( - functions.explode( - functions.split(lines.col("value"), " ") - ).alias("word") - ).as(Encoders.STRING()); + Dataset words = lines.select( + functions.explode( + functions.split(lines.col("value"), " ") + ).alias("word") + ); // Generate running word count Dataset wordCounts = words.groupBy("word").count(); diff --git a/examples/src/main/scala/org/apache/spark/examples/sql/streaming/StructuredNetworkWordCount.scala b/examples/src/main/scala/org/apache/spark/examples/sql/streaming/StructuredNetworkWordCount.scala index b63010a324d9e..96fa5cd1c8c8c 100644 --- a/examples/src/main/scala/org/apache/spark/examples/sql/streaming/StructuredNetworkWordCount.scala +++ b/examples/src/main/scala/org/apache/spark/examples/sql/streaming/StructuredNetworkWordCount.scala @@ -60,7 +60,8 @@ object StructuredNetworkWordCount { val words = lines.select( explode( split(lines.col("value"), " ") - ).alias("word")) + ).alias("word") + ) // Generate running word count val wordCounts = words.groupBy("word").count()