-
Notifications
You must be signed in to change notification settings - Fork 1
/
HiveSqlDialect.java
157 lines (138 loc) · 7.11 KB
/
HiveSqlDialect.java
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
package com.exasol.adapter.dialects.hive;
import static com.exasol.adapter.AdapterProperties.CATALOG_NAME_PROPERTY;
import static com.exasol.adapter.AdapterProperties.SCHEMA_NAME_PROPERTY;
import static com.exasol.adapter.capabilities.AggregateFunctionCapability.*;
import static com.exasol.adapter.capabilities.LiteralCapability.*;
import static com.exasol.adapter.capabilities.MainCapability.*;
import static com.exasol.adapter.capabilities.PredicateCapability.*;
import static com.exasol.adapter.capabilities.ScalarFunctionCapability.*;
import static com.exasol.adapter.dialects.hive.HiveProperties.HIVE_CAST_NUMBER_TO_DECIMAL_PROPERTY;
import java.sql.SQLException;
import java.util.*;
import com.exasol.adapter.AdapterProperties;
import com.exasol.adapter.capabilities.Capabilities;
import com.exasol.adapter.dialects.*;
import com.exasol.adapter.dialects.rewriting.ImportIntoTemporaryTableQueryRewriter;
import com.exasol.adapter.dialects.rewriting.SqlGenerationContext;
import com.exasol.adapter.jdbc.*;
import com.exasol.adapter.properties.CastNumberToDecimalProperty;
import com.exasol.adapter.sql.ScalarFunction;
import com.exasol.errorreporting.ExaError;
/**
 * SQL dialect for Apache Hive, accessed through the Cloudera Hive JDBC Driver/Connector (developed by Simba).
 * <p>
 * Only Hive 2.1.0 and later is supported, because the dialect relies on the {@code NULLS FIRST} /
 * {@code NULLS LAST} option of {@code ORDER BY}.
 * </p>
 */
public class HiveSqlDialect extends AbstractSqlDialect {
    /** Name under which this dialect is known. */
    static final String NAME = "HIVE";
    /** Capability set of the dialect; built once and shared by all instances. */
    private static final Capabilities CAPABILITIES = createCapabilityList();

    /**
     * Assemble the capabilities this dialect reports.
     *
     * @return main, predicate, literal, aggregate-function and scalar-function capabilities of the Hive dialect
     */
    private static Capabilities createCapabilityList() {
        return Capabilities.builder()
                // select list, filtering, grouping, ordering, limiting and joins
                .addMain(SELECTLIST_PROJECTION, SELECTLIST_EXPRESSIONS, FILTER_EXPRESSIONS, AGGREGATE_SINGLE_GROUP,
                        AGGREGATE_GROUP_BY_COLUMN, AGGREGATE_HAVING, ORDER_BY_COLUMN, ORDER_BY_EXPRESSION, LIMIT,
                        JOIN, JOIN_TYPE_INNER, JOIN_TYPE_LEFT_OUTER, JOIN_TYPE_RIGHT_OUTER, JOIN_TYPE_FULL_OUTER,
                        JOIN_CONDITION_EQUI)
                // predicates
                .addPredicate(AND, OR, NOT, EQUAL, NOTEQUAL, LESS, LESSEQUAL, LIKE, REGEXP_LIKE, BETWEEN,
                        IN_CONSTLIST, IS_NULL, IS_NOT_NULL)
                // literals
                .addLiteral(NULL, BOOL, DATE, TIMESTAMP, DOUBLE, EXACTNUMERIC, STRING)
                // aggregate functions
                .addAggregateFunction(COUNT, COUNT_STAR, COUNT_DISTINCT, SUM, SUM_DISTINCT, MIN, MAX, AVG,
                        AVG_DISTINCT, STDDEV_POP, STDDEV_POP_DISTINCT, STDDEV_SAMP, STDDEV_SAMP_DISTINCT, VAR_POP,
                        VAR_POP_DISTINCT, VAR_SAMP, VAR_SAMP_DISTINCT, COUNT_TUPLE)
                // scalar functions
                .addScalarFunction(ADD, SUB, MULT, FLOAT_DIV, NEG, ABS, ACOS, ASIN, ATAN, CEIL, COS, DEGREES, DIV,
                        EXP, FLOOR, LN, LOG, MOD, POWER, RADIANS, SIGN, SIN, SQRT, TAN, ASCII, CONCAT, LENGTH,
                        LOWER, LPAD, REPEAT, REVERSE, RPAD, SOUNDEX, SPACE, SUBSTR, TRANSLATE, UPPER, ADD_DAYS,
                        ADD_MONTHS, CURRENT_DATE, CURRENT_TIMESTAMP, DATE_TRUNC, DAY, DAYS_BETWEEN, MINUTE, MONTH,
                        MONTHS_BETWEEN, SECOND, WEEK, CAST, BIT_AND, BIT_OR, BIT_XOR, CURRENT_USER, BIT_LSHIFT,
                        BIT_RSHIFT, HOUR, INITCAP)
                .build();
    }

    /**
     * Create a new instance of the {@link HiveSqlDialect}.
     * <p>
     * Besides whatever the parent class handles, the dialect accepts the catalog name, the schema name and the
     * Hive "cast number to decimal" property; the latter is checked by a dedicated validator.
     * </p>
     *
     * @param connectionFactory factory for the JDBC connection to the remote data source
     * @param properties        user-defined adapter properties
     */
    public HiveSqlDialect(final ConnectionFactory connectionFactory, final AdapterProperties properties) {
        super(connectionFactory, properties,
                Set.of(CATALOG_NAME_PROPERTY, SCHEMA_NAME_PROPERTY, HIVE_CAST_NUMBER_TO_DECIMAL_PROPERTY),
                List.of(CastNumberToDecimalProperty.validator(HIVE_CAST_NUMBER_TO_DECIMAL_PROPERTY)));
    }

    /**
     * Get the name of this dialect.
     *
     * @return the constant {@code "HIVE"}
     */
    @Override
    public String getName() {
        return NAME;
    }

    /**
     * Get the capabilities of this dialect.
     *
     * @return the shared, pre-built capability set
     */
    @Override
    public Capabilities getCapabilities() {
        return CAPABILITIES;
    }

    /**
     * Report how the JDBC driver exposes catalogs.
     * <p>
     * Quote from the user manual: The Cloudera JDBC Driver for Apache Hive supports both catalogs and schemas to
     * make it easy for the driver to work with various JDBC applications. Since Hive only organizes tables into
     * schemas/databases, the driver provides a synthetic catalog called "HIVE" under which all of the
     * schemas/databases are organized. The driver also maps the JDBC schema to the Hive schema/database.
     * </p>
     *
     * @return {@link StructureElementSupport#SINGLE}
     */
    @Override
    public StructureElementSupport supportsJdbcCatalogs() {
        return StructureElementSupport.SINGLE;
    }

    /**
     * Report how the JDBC driver exposes schemas.
     *
     * @return {@link StructureElementSupport#MULTIPLE}
     */
    @Override
    public StructureElementSupport supportsJdbcSchemas() {
        return StructureElementSupport.MULTIPLE;
    }

    /**
     * Quote an identifier with backticks, doubling every backtick contained in the identifier itself.
     * <p>
     * See https://cwiki.apache.org/confluence/display/Hive/LanguageManual+DDL
     * </p>
     *
     * @param identifier identifier to quote
     * @return identifier enclosed in backticks
     */
    @Override
    public String applyQuote(final String identifier) {
        final String escapedIdentifier = identifier.replace("`", "``");
        return "`" + escapedIdentifier + "`";
    }

    /**
     * Tell whether table names need to be qualified with the catalog.
     *
     * @param context SQL generation context (not evaluated by this dialect)
     * @return always {@code false}
     */
    @Override
    public boolean requiresCatalogQualifiedTableNames(final SqlGenerationContext context) {
        return false;
    }

    /**
     * Tell whether table names need to be qualified with the schema.
     *
     * @param context SQL generation context (not evaluated by this dialect)
     * @return always {@code true}
     */
    @Override
    public boolean requiresSchemaQualifiedTableNames(final SqlGenerationContext context) {
        return true;
    }

    /**
     * Get the default position of {@code NULL} values in sorted results.
     *
     * @return {@link NullSorting#NULLS_SORTED_LOW}
     */
    @Override
    public NullSorting getDefaultNullSorting() {
        return NullSorting.NULLS_SORTED_LOW;
    }

    /**
     * Render a string value as a single-quoted literal, escaping backslashes and single quotes with a backslash.
     * <p>
     * See https://cwiki.apache.org/confluence/display/Hive/LanguageManual+Types#LanguageManualTypes-StringsstringStrings
     * and https://cwiki.apache.org/confluence/display/Hive/CAST...FORMAT+with+SQL%3A2016+datetime+formats
     * </p>
     *
     * @param value string to render; may be {@code null}
     * @return quoted and escaped literal, or the keyword {@code NULL} if {@code value} is {@code null}
     */
    @Override
    public String getStringLiteral(final String value) {
        if (value == null) {
            return "NULL";
        }
        // Backslashes have to be doubled first, otherwise the ones introduced for the quotes would be doubled too.
        final String withEscapedBackslashes = value.replace("\\", "\\\\");
        final String fullyEscaped = withEscapedBackslashes.replace("'", "\\'");
        return "'" + fullyEscaped + "'";
    }

    /**
     * Create the SQL generator for this dialect.
     *
     * @param context SQL generation context handed to the generator
     * @return new {@code HiveSqlGenerationVisitor} bound to this dialect and the given context
     */
    @Override
    public SqlGenerator getSqlGenerator(final SqlGenerationContext context) {
        return new HiveSqlGenerationVisitor(this, context);
    }

    /**
     * Get the dialect-specific aliases of scalar functions.
     *
     * @return newly created map from scalar function to its alias
     */
    @Override
    public Map<ScalarFunction, String> getScalarFunctionAliases() {
        final Map<ScalarFunction, String> aliases = new EnumMap<>(ScalarFunction.class);
        // date and time functions
        aliases.put(ScalarFunction.ADD_DAYS, "DATE_ADD");
        aliases.put(ScalarFunction.DAYS_BETWEEN, "DATEDIFF");
        aliases.put(ScalarFunction.WEEK, "WEEKOFYEAR");
        // bit shifting
        aliases.put(ScalarFunction.BIT_LSHIFT, "SHIFTLEFT");
        aliases.put(ScalarFunction.BIT_RSHIFT, "SHIFTRIGHT");
        // session information
        aliases.put(ScalarFunction.CURRENT_USER, "CURRENT_USER()");
        return aliases;
    }

    /**
     * Create the reader for the metadata of the remote Hive data source, using a connection obtained from the
     * connection factory.
     *
     * @return new {@code HiveMetadataReader}
     * @throws RemoteMetadataReaderException if obtaining the connection fails with an {@link SQLException}
     */
    @Override
    protected RemoteMetadataReader createRemoteMetadataReader() {
        try {
            return new HiveMetadataReader(this.connectionFactory.getConnection(), this.properties);
        } catch (final SQLException exception) {
            final String errorMessage = ExaError.messageBuilder("E-VSHIVE-1")
                    .message("Unable to create Hive remote metadata reader. Caused by: {{cause|u}}",
                            exception.getMessage())
                    .toString();
            throw new RemoteMetadataReaderException(errorMessage, exception);
        }
    }

    /**
     * Create the query rewriter of this dialect.
     *
     * @return new {@code ImportIntoTemporaryTableQueryRewriter} backed by a freshly created remote metadata reader
     */
    @Override
    protected QueryRewriter createQueryRewriter() {
        final RemoteMetadataReader metadataReader = createRemoteMetadataReader();
        return new ImportIntoTemporaryTableQueryRewriter(this, metadataReader, this.connectionFactory);
    }
}