-
Notifications
You must be signed in to change notification settings - Fork 7
/
Copy pathsql.go
98 lines (85 loc) · 2.69 KB
/
sql.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
package bigquerysql
import (
"fmt"
"strings"
"github.com/pingcap-inc/tidb2dw/pkg/utils"
"github.com/pingcap/errors"
"github.com/pingcap/tiflow/pkg/sink/cloudstorage"
)
// GenMergeInto builds the BigQuery MERGE statement that applies the change
// rows found in the external table `datasetID.externalTableID` to the target
// table `datasetID.tableID`.
//
// The source side of the merge is de-duplicated first: rows are partitioned by
// the primary-key columns of tableDef (those whose IsPK is "true"), ordered by
// utils.CDCCommitTsColumnName descending, and only the first row of each
// partition is kept. The merge then:
//   - updates every column of a matched row whose utils.CDCFlagColumnName is not 'D',
//   - deletes a matched row whose flag is 'D',
//   - inserts an unmatched row whose flag is not 'D'.
//
// Every column name taken from tableDef is wrapped in backticks wherever it
// appears (PARTITION BY, ON, SET, INSERT and VALUES), so names that are
// reserved words or contain non-identifier characters stay valid.
//
// NOTE(review): when tableDef has no primary-key column the PARTITION BY list
// and the ON predicate are emitted empty; callers presumably guarantee that at
// least one primary-key column exists — confirm.
func GenMergeInto(tableDef cloudstorage.TableDefinition, datasetID, tableID, externalTableID string) string {
	columnCount := len(tableDef.Columns)
	pkColumn := make([]string, 0)
	onStat := make([]string, 0)
	updateStat := make([]string, 0, columnCount)
	insertStat := make([]string, 0, columnCount)
	valuesStat := make([]string, 0, columnCount)

	// One pass over the columns fills every clause fragment.
	for _, col := range tableDef.Columns {
		quoted := fmt.Sprintf("`%s`", col.Name)
		if col.IsPK == "true" {
			pkColumn = append(pkColumn, quoted)
			onStat = append(onStat, fmt.Sprintf("T.%s = S.%s", quoted, quoted))
		}
		updateStat = append(updateStat, fmt.Sprintf("%s = S.%s", quoted, quoted))
		insertStat = append(insertStat, quoted)
		valuesStat = append(valuesStat, fmt.Sprintf("S.%s", quoted))
	}

	mergeSQL := fmt.Sprintf(
		`MERGE INTO %s AS T USING
(
SELECT * EXCEPT(row_num)
FROM (
SELECT
*, row_number() over (partition by %s order by %s desc) as row_num
FROM %s
)
WHERE row_num = 1
) AS S
ON
(
%s
)
WHEN MATCHED AND S.%s != 'D' THEN UPDATE SET %s
WHEN MATCHED AND S.%s = 'D' THEN DELETE
WHEN NOT MATCHED AND S.%s != 'D' THEN INSERT (%s) VALUES (%s);`,
		fmt.Sprintf("`%s.%s`", datasetID, tableID),
		strings.Join(pkColumn, ", "),
		utils.CDCCommitTsColumnName,
		fmt.Sprintf("`%s.%s`", datasetID, externalTableID),
		strings.Join(onStat, " AND "),
		utils.CDCFlagColumnName,
		strings.Join(updateStat, ", "),
		utils.CDCFlagColumnName,
		utils.CDCFlagColumnName,
		strings.Join(insertStat, ", "),
		strings.Join(valuesStat, ", "),
	)

	return mergeSQL
}
// GenCreateSchema builds a BigQuery `CREATE OR REPLACE TABLE` statement for
// the table `datasetID.tableID`.
//
// Each entry of columns is rendered through GetBigQueryColumnString and becomes
// one line of the column list. When pkColumns is non-empty, a trailing
// `PRIMARY KEY (...) NOT ENFORCED` constraint is appended, with every key
// column quoted individually so composite keys are listed as separate columns.
// The table path is backtick-quoted as a whole, matching GenMergeInto.
//
// It returns the statement text, or the traced error from
// GetBigQueryColumnString if a column cannot be rendered.
func GenCreateSchema(columns []cloudstorage.TableCol, pkColumns []string, datasetID, tableID string) (string, error) {
	// One slot per column plus one for the optional primary-key constraint.
	sqlRows := make([]string, 0, len(columns)+1)
	for _, column := range columns {
		row, err := GetBigQueryColumnString(column, true)
		if err != nil {
			return "", errors.Trace(err)
		}
		sqlRows = append(sqlRows, row)
	}

	if len(pkColumns) > 0 {
		// Joining with "`, `" closes and reopens the quoting between names, so
		// the format string's outer backticks end up quoting each column separately.
		sqlRows = append(sqlRows, fmt.Sprintf("PRIMARY KEY (`%s`) NOT ENFORCED", strings.Join(pkColumns, "`, `")))
	}

	// Indent every row of the table body.
	for i := range sqlRows {
		sqlRows[i] = fmt.Sprintf(" %s", sqlRows[i])
	}

	sql := []string{
		fmt.Sprintf("CREATE OR REPLACE TABLE `%s.%s` (", datasetID, tableID),
		strings.Join(sqlRows, ",\n"),
		")",
	}

	return strings.Join(sql, "\n"), nil
}