-
Notifications
You must be signed in to change notification settings - Fork 703
/
SparkSQLUtil.scala
121 lines (108 loc) · 5.25 KB
/
SparkSQLUtil.scala
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.spark.sql.util
import java.lang.reflect.Method
import org.apache.hadoop.conf.Configuration
import org.apache.spark.SparkContext
import org.apache.spark.broadcast.Broadcast
import org.apache.spark.sql.{DataFrame, Dataset, SparkSession}
import org.apache.spark.sql.catalyst.plans.logical.{LogicalPlan, Statistics}
import org.apache.spark.sql.catalyst.rules.Rule
import org.apache.spark.sql.internal.{SessionState, SQLConf}
import org.apache.spark.util.{CarbonReflectionUtils, SerializableConfiguration, SparkUtil}
/**
 * Utility methods that give callers access to Spark SQL internals and hide the API
 * differences between Spark 2.2 and Spark 2.3+ behind reflection.
 */
object SparkSQLUtil {

  /** Package that contains the Catalyst optimizer rules instantiated reflectively below. */
  private val OptimizerPackage = "org.apache.spark.sql.catalyst.optimizer"

  /** Returns the `SessionState` of the given session. */
  def sessionState(sparkSession: SparkSession): SessionState = sparkSession.sessionState

  /** Builds a `DataFrame` for `logicalPlan` on `sparkSession` through `Dataset.ofRows`. */
  def execute(logicalPlan: LogicalPlan, sparkSession: SparkSession): DataFrame = {
    Dataset.ofRows(sparkSession, logicalPlan)
  }

  /**
   * Returns the default `SparkSession`.
   *
   * @throws NoSuchElementException if no default session has been set
   */
  def getSparkSession: SparkSession = {
    // Same exception type as a bare `Option.get`, but with a message that names the cause.
    SparkSession.getDefaultSession.getOrElse(
      throw new NoSuchElementException("No default SparkSession has been set"))
  }

  /**
   * Reflectively invokes the `stats` method of a logical plan.
   *
   * On Spark 2.2 the method taking a `SQLConf` is looked up and called with `conf`;
   * on Spark 2.3 and above the no-argument method is looked up and `conf` is not used.
   *
   * @param logicalPlanObj plan whose statistics are requested
   * @param conf           configuration passed to `stats` on Spark 2.2
   * @return the value returned by `stats`, cast to `Statistics`
   * @throws UnsupportedOperationException if the Spark version matches neither branch
   */
  def invokeStatsMethod(logicalPlanObj: LogicalPlan, conf: SQLConf): Statistics = {
    if (SparkUtil.isSparkVersionEqualTo("2.2")) {
      val method: Method = logicalPlanObj.getClass.getMethod("stats", classOf[SQLConf])
      method.invoke(logicalPlanObj, conf).asInstanceOf[Statistics]
    } else if (SparkUtil.isSparkVersionXandAbove("2.3")) {
      val method: Method = logicalPlanObj.getClass.getMethod("stats")
      method.invoke(logicalPlanObj).asInstanceOf[Statistics]
    } else {
      throw new UnsupportedOperationException("Spark version not supported")
    }
  }

  /** Returns the optimizer's `ReorderJoin` rule for the running Spark version. */
  def getReorderJoinObj(conf: SQLConf): Rule[LogicalPlan] = {
    createOptimizerRule("ReorderJoin", conf)
  }

  /** Returns the optimizer's `EliminateOuterJoin` rule for the running Spark version. */
  def getEliminateOuterJoinObj(conf: SQLConf): Rule[LogicalPlan] = {
    createOptimizerRule("EliminateOuterJoin", conf)
  }

  /** Returns the optimizer's `NullPropagation` rule for the running Spark version. */
  def getNullPropagationObj(conf: SQLConf): Rule[LogicalPlan] = {
    createOptimizerRule("NullPropagation", conf)
  }

  /** Returns the optimizer's `CheckCartesianProducts` rule for the running Spark version. */
  def getCheckCartesianProductsObj(conf: SQLConf): Rule[LogicalPlan] = {
    createOptimizerRule("CheckCartesianProducts", conf)
  }

  /**
   * Reflectively obtains the optimizer rule named `ruleName` from [[OptimizerPackage]].
   *
   * On Spark 2.2 the class is created through `CarbonReflectionUtils.createObject` with
   * `conf` as its argument. On Spark 2.3 and above the `$`-suffixed class name is passed to
   * `CarbonReflectionUtils.createObjectOfPrivateConstructor` with no arguments, so `conf`
   * is not used on that path.
   *
   * @param ruleName simple class name of the rule, without package or `$` suffix
   * @param conf     configuration handed to the rule on Spark 2.2
   * @throws UnsupportedOperationException if the Spark version matches neither branch
   */
  private def createOptimizerRule(ruleName: String, conf: SQLConf): Rule[LogicalPlan] = {
    val className = OptimizerPackage + "." + ruleName
    if (SparkUtil.isSparkVersionEqualTo("2.2")) {
      CarbonReflectionUtils.createObject(className, conf)._1.asInstanceOf[Rule[LogicalPlan]]
    } else if (SparkUtil.isSparkVersionXandAbove("2.3")) {
      CarbonReflectionUtils.createObjectOfPrivateConstructor(className + "$")._1
        .asInstanceOf[Rule[LogicalPlan]]
    } else {
      throw new UnsupportedOperationException("Spark version not supported")
    }
  }

  /**
   * Broadcasts a Hadoop configuration wrapped in a `SerializableConfiguration`.
   *
   * @param sparkContext context used to create the broadcast variable
   * @param hadoopConf   Hadoop configuration to wrap and broadcast
   * @return the broadcast handle holding the wrapped configuration
   */
  def broadCastHadoopConf(sparkContext: SparkContext,
      hadoopConf: Configuration): Broadcast[SerializableConfiguration] = {
    sparkContext.broadcast(getSerializableConfigurableInstance(hadoopConf))
  }

  /**
   * Wraps a Hadoop configuration in a new `SerializableConfiguration`.
   *
   * @param hadoopConf Hadoop configuration to wrap
   * @return a new `SerializableConfiguration` constructed from `hadoopConf`
   */
  def getSerializableConfigurableInstance(
      hadoopConf: Configuration): SerializableConfiguration = {
    new SerializableConfiguration(hadoopConf)
  }
}