apache · karuppayya · May 31, 2020 · Jun 1, 2020 · Jun 2, 2020 · Jun 3, 2020
diff --git a/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/catalog/interface.scala b/sql/catalyst/src/main/scala/org/apache/spark/sql/catalyst/catalog/interface.scala
@@ -654,7 +654,7 @@ case class HiveTableRelation(
     tableMeta: CatalogTable,
     dataCols: Seq[AttributeReference],
     partitionCols: Seq[AttributeReference],
-    tableStats: Option[Statistics] = None,
+    tableStats: Option[Statistics] = Some(Statistics(sizeInBytes = SQLConf.get.defaultSizeInBytes)),
     @transient prunedPartitions: Option[Seq[CatalogTablePartition]] = None)
   extends LeafNode with MultiInstanceRelation {
   assert(tableMeta.identifier.database.isDefined)

diff --git a/sql/hive/src/main/scala/org/apache/spark/sql/hive/HiveSessionStateBuilder.scala b/sql/hive/src/main/scala/org/apache/spark/sql/hive/HiveSessionStateBuilder.scala
@@ -82,8 +82,8 @@ class HiveSessionStateBuilder(session: SparkSession, parentState: Option[Session
 
     override val postHocResolutionRules: Seq[Rule[LogicalPlan]] =
       new DetectAmbiguousSelfJoin(conf) +:
-        new DetermineTableStats(session) +:
         RelationConversions(conf, catalog) +:
+        new DetermineTableStats(session) +:
         PreprocessTableCreation(session) +:
         PreprocessTableInsertion(conf) +:
         DataSourceAnalysis(conf) +:

diff --git a/sql/hive/src/test/scala/org/apache/spark/sql/hive/execution/HiveExplainSuite.scala b/sql/hive/src/test/scala/org/apache/spark/sql/hive/execution/HiveExplainSuite.scala
@@ -62,13 +62,15 @@ class HiveExplainSuite extends QueryTest with SQLTestUtils with TestHiveSingleto
     }
 
-    // No statistics information if "cost" is not specified
+    // Without "cost", the plan still prints sizeInBytes but must not print rowCount
-    checkKeywordsNotExist(sql("EXPLAIN  SELECT * FROM src "), "sizeInBytes", "rowCount")
+    checkKeywordsExist(sql("EXPLAIN  SELECT * FROM src "), "sizeInBytes=8.0 EiB")
+    checkKeywordsNotExist(sql("EXPLAIN  SELECT * FROM src "), "rowCount")
   }
 
   test("explain extended command") {
     checkKeywordsExist(sql(" explain   select * from src where key=123 "),
                    "== Physical Plan ==",
-                   "org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe")
+                   "org.apache.hadoop.hive.serde2.lazy.LazySimpleSerDe",
+                   "Statistics(sizeInBytes=8.0 EiB)")
 
     checkKeywordsNotExist(sql(" explain   select * from src where key=123 "),
                    "== Parsed Logical Plan ==",
@@ -81,7 +83,6 @@ class HiveExplainSuite extends QueryTest with SQLTestUtils with TestHiveSingleto
                    "Type",
                    "Provider",
                    "Properties",
-                   "Statistics",
                    "Location",
                    "Serde Library",
                    "InputFormat",