From 4af272de6dd9146fa7cf117c6d1bd3245ebedb57 Mon Sep 17 00:00:00 2001 From: Christiam Camacho Date: Tue, 1 Aug 2017 12:30:06 -0400 Subject: [PATCH 1/2] Fix Java SimpleApp spark application --- docs/quick-start.md | 7 ++++++- 1 file changed, 6 insertions(+), 1 deletion(-) diff --git a/docs/quick-start.md b/docs/quick-start.md index 7cb3f75132206..d702b9d9118af 100644 --- a/docs/quick-start.md +++ b/docs/quick-start.md @@ -297,12 +297,13 @@ We'll create a very simple Spark application, `SimpleApp.java`: {% highlight java %} /* SimpleApp.java */ import org.apache.spark.sql.SparkSession; +import org.apache.spark.sql.Dataset; public class SimpleApp { public static void main(String[] args) { String logFile = "YOUR_SPARK_HOME/README.md"; // Should be some file on your system SparkSession spark = SparkSession.builder().appName("Simple Application").getOrCreate(); - Dataset logData = spark.read.textFile(logFile).cache(); + Dataset logData = spark.read().textFile(logFile).cache(); long numAs = logData.filter(s -> s.contains("a")).count(); long numBs = logData.filter(s -> s.contains("b")).count(); @@ -330,6 +331,10 @@ Note that Spark artifacts are tagged with a Scala version. Simple Project jar 1.0 + + 1.8 + 1.8 + org.apache.spark From 74717812ec6488028647afd5793ba80cff423e9c Mon Sep 17 00:00:00 2001 From: Christiam Camacho Date: Wed, 2 Aug 2017 07:16:42 -0400 Subject: [PATCH 2/2] Additional fixes for Java --- docs/quick-start.md | 4 ---- docs/structured-streaming-programming-guide.md | 6 +++--- 2 files changed, 3 insertions(+), 7 deletions(-) diff --git a/docs/quick-start.md b/docs/quick-start.md index d702b9d9118af..a85e5b28a6996 100644 --- a/docs/quick-start.md +++ b/docs/quick-start.md @@ -331,10 +331,6 @@ Note that Spark artifacts are tagged with a Scala version. 
Simple Project jar 1.0 - - 1.8 - 1.8 - org.apache.spark diff --git a/docs/structured-streaming-programming-guide.md b/docs/structured-streaming-programming-guide.md index 8f64faadc32dc..8367f5a08c755 100644 --- a/docs/structured-streaming-programming-guide.md +++ b/docs/structured-streaming-programming-guide.md @@ -1041,8 +1041,8 @@ streamingDf.join(staticDf, "type", "right_join") // right outer join with a sta
{% highlight java %} -Dataset<Row> staticDf = spark.read. ...; -Dataset<Row> streamingDf = spark.readStream. ...; +Dataset<Row> staticDf = spark.read(). ...; +Dataset<Row> streamingDf = spark.readStream(). ...; streamingDf.join(staticDf, "type"); // inner equi-join with a static DF streamingDf.join(staticDf, "type", "right_join"); // right outer join with a static DF {% endhighlight %} @@ -1087,7 +1087,7 @@ streamingDf
{% highlight java %} -Dataset<Row> streamingDf = spark.readStream. ...; // columns: guid, eventTime, ... +Dataset<Row> streamingDf = spark.readStream(). ...; // columns: guid, eventTime, ... // Without watermark using guid column streamingDf.dropDuplicates("guid");