You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@spark.apache.org by do...@apache.org on 2018/09/17 18:26:33 UTC
spark git commit: [SPARK-25423][SQL] Output "dataFilters" in DataSourceScanExec.metadata
Repository: spark
Updated Branches:
refs/heads/master 30aa37fca -> 4b9542e3a
[SPARK-25423][SQL] Output "dataFilters" in DataSourceScanExec.metadata
## What changes were proposed in this pull request?
Output `dataFilters` in `DataSourceScanExec.metadata`.
## How was this patch tested?
Unit tests: added the `FileSourceScanExec metadata` test to `DataSourceScanExecRedactionSuite`.
Closes #22435 from wangyum/SPARK-25423.
Authored-by: Yuming Wang <yu...@ebay.com>
Signed-off-by: Dongjoon Hyun <do...@apache.org>
Project: http://git-wip-us.apache.org/repos/asf/spark/repo
Commit: http://git-wip-us.apache.org/repos/asf/spark/commit/4b9542e3
Tree: http://git-wip-us.apache.org/repos/asf/spark/tree/4b9542e3
Diff: http://git-wip-us.apache.org/repos/asf/spark/diff/4b9542e3
Branch: refs/heads/master
Commit: 4b9542e3a3d0c493a05061be5a9f8d278c0ac980
Parents: 30aa37f
Author: Yuming Wang <yu...@ebay.com>
Authored: Mon Sep 17 11:26:08 2018 -0700
Committer: Dongjoon Hyun <do...@apache.org>
Committed: Mon Sep 17 11:26:08 2018 -0700
----------------------------------------------------------------------
.../spark/sql/execution/DataSourceScanExec.scala | 1 +
.../DataSourceScanExecRedactionSuite.scala | 16 ++++++++++++++++
2 files changed, 17 insertions(+)
----------------------------------------------------------------------
http://git-wip-us.apache.org/repos/asf/spark/blob/4b9542e3/sql/core/src/main/scala/org/apache/spark/sql/execution/DataSourceScanExec.scala
----------------------------------------------------------------------
diff --git a/sql/core/src/main/scala/org/apache/spark/sql/execution/DataSourceScanExec.scala b/sql/core/src/main/scala/org/apache/spark/sql/execution/DataSourceScanExec.scala
index 36ed016..738c066 100644
--- a/sql/core/src/main/scala/org/apache/spark/sql/execution/DataSourceScanExec.scala
+++ b/sql/core/src/main/scala/org/apache/spark/sql/execution/DataSourceScanExec.scala
@@ -284,6 +284,7 @@ case class FileSourceScanExec(
"Batched" -> supportsBatch.toString,
"PartitionFilters" -> seqToString(partitionFilters),
"PushedFilters" -> seqToString(pushedDownFilters),
+ "DataFilters" -> seqToString(dataFilters),
"Location" -> locationDesc)
val withOptPartitionCount =
relation.partitionSchemaOption.map { _ =>
http://git-wip-us.apache.org/repos/asf/spark/blob/4b9542e3/sql/core/src/test/scala/org/apache/spark/sql/execution/DataSourceScanExecRedactionSuite.scala
----------------------------------------------------------------------
diff --git a/sql/core/src/test/scala/org/apache/spark/sql/execution/DataSourceScanExecRedactionSuite.scala b/sql/core/src/test/scala/org/apache/spark/sql/execution/DataSourceScanExecRedactionSuite.scala
index c8d045a..11a1c9a 100644
--- a/sql/core/src/test/scala/org/apache/spark/sql/execution/DataSourceScanExecRedactionSuite.scala
+++ b/sql/core/src/test/scala/org/apache/spark/sql/execution/DataSourceScanExecRedactionSuite.scala
@@ -83,4 +83,20 @@ class DataSourceScanExecRedactionSuite extends QueryTest with SharedSQLContext {
}
}
+ test("FileSourceScanExec metadata") {
+ withTempPath { path =>
+ val dir = path.getCanonicalPath
+ spark.range(0, 10).write.parquet(dir)
+ val df = spark.read.parquet(dir)
+
+ assert(isIncluded(df.queryExecution, "Format"))
+ assert(isIncluded(df.queryExecution, "ReadSchema"))
+ assert(isIncluded(df.queryExecution, "Batched"))
+ assert(isIncluded(df.queryExecution, "PartitionFilters"))
+ assert(isIncluded(df.queryExecution, "PushedFilters"))
+ assert(isIncluded(df.queryExecution, "DataFilters"))
+ assert(isIncluded(df.queryExecution, "Location"))
+ }
+ }
+
}
---------------------------------------------------------------------
To unsubscribe, e-mail: commits-unsubscribe@spark.apache.org
For additional commands, e-mail: commits-help@spark.apache.org