From e0fc9c7e59848cb78f8d598898bfca004a3710d8 Mon Sep 17 00:00:00 2001 From: Wenchen Fan Date: Wed, 4 Nov 2015 09:33:30 -0800 Subject: [SPARK-11197][SQL] add doc for run SQL on files directly Author: Wenchen Fan Closes #9467 from cloud-fan/doc. --- docs/sql-programming-guide.md | 38 ++++++++++++++++++++++++++++++++++++++ 1 file changed, 38 insertions(+) (limited to 'docs/sql-programming-guide.md') diff --git a/docs/sql-programming-guide.md b/docs/sql-programming-guide.md index 510b359972..2fe5c36338 100644 --- a/docs/sql-programming-guide.md +++ b/docs/sql-programming-guide.md @@ -882,6 +882,44 @@ saveDF(select(df, "name", "age"), "namesAndAges.parquet", "parquet") +### Run SQL on files directly + +Instead of using the read API to load a file into a DataFrame and query it, you can also query that +file directly with SQL. + +<div class="codetabs">
+<div data-lang="scala" markdown="1">
+ +{% highlight scala %} +val df = sqlContext.sql("SELECT * FROM parquet.`examples/src/main/resources/users.parquet`") +{% endhighlight %} + +</div>
+ +<div data-lang="java" markdown="1">
+ +{% highlight java %} +DataFrame df = sqlContext.sql("SELECT * FROM parquet.`examples/src/main/resources/users.parquet`"); +{% endhighlight %} +</div>
+ +<div data-lang="python" markdown="1">
+ +{% highlight python %} +df = sqlContext.sql("SELECT * FROM parquet.`examples/src/main/resources/users.parquet`") +{% endhighlight %} + +</div>
+ +<div data-lang="r" markdown="1">
+ +{% highlight r %} +df <- sql(sqlContext, "SELECT * FROM parquet.`examples/src/main/resources/users.parquet`") +{% endhighlight %} + +</div>
+</div>
+ ### Save Modes Save operations can optionally take a `SaveMode`, that specifies how to handle existing data if -- cgit v1.2.3