forked from raystack/optimus
-
Notifications
You must be signed in to change notification settings - Fork 1
/
external_table.go
156 lines (129 loc) · 4.45 KB
/
external_table.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
package bigquery
import (
"context"
"net/http"
"strings"
"cloud.google.com/go/bigquery"
"google.golang.org/api/googleapi"
"github.com/goto/optimus/core/resource"
"github.com/goto/optimus/internal/errors"
)
// Keys used to look up values in resource configuration maps.
const (
// expirationTimeKey is not referenced in the visible part of this file;
// presumably consumed by the metadata helpers elsewhere in the package — TODO confirm.
expirationTimeKey = "expiration_time"
// skipLeadingRowsKey is the config key read by bqGoogleSheetsOptionsTo for
// the number of leading rows to skip.
skipLeadingRowsKey = "skip_leading_rows"
// rangeKey is the config key read by bqGoogleSheetsOptionsTo for the sheet range.
rangeKey = "range"
)
// ExternalTableHandle creates, updates, and checks the existence of an
// external table by delegating to the wrapped BqTable.
type ExternalTableHandle struct {
// bqExternalTable receives the Create, Update and Metadata calls made by this handle.
bqExternalTable BqTable
}
// Create creates the external table described by res through the wrapped BqTable.
//
// The resource spec is converted to an ExternalTable, creation metadata is
// built from its description, extra config and the resource labels, and the
// external data configuration is derived from the spec's source. A schema is
// attached to the metadata only when the spec declares one.
//
// Returned errors:
//   - spec conversion and external data config errors are returned unchanged;
//   - metadata construction errors are returned with added context;
//   - a googleapi.Error with HTTP status 409 (Conflict) whose message contains
//     "Already Exists" is mapped to errors.AlreadyExists;
//   - any other create failure is wrapped in errors.InternalError.
func (et ExternalTableHandle) Create(ctx context.Context, res *resource.Resource) error {
	externalTable, err := ConvertSpecTo[ExternalTable](res)
	if err != nil {
		return err
	}

	meta, err := getMetadataToCreate(externalTable.Description, externalTable.ExtraConfig, res.Metadata().Labels)
	if err != nil {
		return errors.AddErrContext(err, EntityExternalTable, "failed to get metadata to create for "+res.FullName())
	}

	if len(externalTable.Schema) > 0 {
		meta.Schema = toBQSchema(externalTable.Schema)
	}

	meta.ExternalDataConfig, err = bqExternalDataConfigTo(externalTable.Source, externalTable.Schema)
	if err != nil {
		return err
	}

	err = et.bqExternalTable.Create(ctx, meta)
	if err != nil {
		var metaErr *googleapi.Error
		// Use the named status constant, matching the http.StatusNotFound check in Update.
		if errors.As(err, &metaErr) &&
			metaErr.Code == http.StatusConflict && strings.Contains(metaErr.Message, "Already Exists") {
			return errors.AlreadyExists(EntityExternalTable, "external table already exists on bigquery: "+res.FullName())
		}
		return errors.InternalError(EntityExternalTable, "failed to create external table "+res.FullName(), err)
	}
	return nil
}
// Update applies the external table definition in res to the existing table
// through the wrapped BqTable.
//
// The update metadata is built from the spec's description, extra config and
// the resource labels; a schema is set only when the spec declares one, and
// the external data configuration is always regenerated from the spec source.
// The update is issued with an empty etag argument.
//
// A googleapi.Error with HTTP status 404 is mapped to errors.NotFound; any
// other update failure is wrapped in errors.InternalError. Spec conversion and
// external data config errors are returned unchanged.
func (et ExternalTableHandle) Update(ctx context.Context, res *resource.Resource) error {
	spec, err := ConvertSpecTo[ExternalTable](res)
	if err != nil {
		return err
	}

	update, err := getMetadataToUpdate(spec.Description, spec.ExtraConfig, res.Metadata().Labels)
	if err != nil {
		return errors.AddErrContext(err, EntityExternalTable, "failed to get metadata to update for "+res.FullName())
	}
	if len(spec.Schema) != 0 {
		update.Schema = toBQSchema(spec.Schema)
	}

	update.ExternalDataConfig, err = bqExternalDataConfigTo(spec.Source, spec.Schema)
	if err != nil {
		return err
	}

	if _, err = et.bqExternalTable.Update(ctx, update, ""); err == nil {
		return nil
	}

	// Translate the BigQuery API failure into the project's error kinds.
	var apiErr *googleapi.Error
	if errors.As(err, &apiErr) && apiErr.Code == http.StatusNotFound {
		return errors.NotFound(EntityExternalTable, "failed to update external_table in bigquery for "+res.FullName())
	}
	return errors.InternalError(EntityExternalTable, "failed to update external_table on bigquery for "+res.FullName(), err)
}
// Exists reports whether basic metadata for the table can be fetched.
// Any error from the metadata call, including a connection problem, is
// reported as false for now.
func (et ExternalTableHandle) Exists(ctx context.Context) bool {
	if _, err := et.bqExternalTable.Metadata(ctx, bigquery.WithMetadataView(bigquery.BasicMetadataView)); err != nil {
		return false
	}
	return true
}
// NewExternalTableHandle returns a handle that issues its table operations
// against bq.
func NewExternalTableHandle(bq BqTable) *ExternalTableHandle {
	handle := new(ExternalTableHandle)
	handle.bqExternalTable = bq
	return handle
}
// bqExternalDataConfigTo builds the BigQuery external data configuration for
// the given source.
//
// The source type is matched case-insensitively; only Google Sheets is
// handled, and any other type yields an InvalidArgument error. When schema is
// empty, schema auto-detection is enabled on the returned config.
//
// A nil es yields an InvalidArgument error instead of a nil-pointer panic.
func bqExternalDataConfigTo(es *ExternalSource, schema Schema) (*bigquery.ExternalDataConfig, error) {
	if es == nil {
		return nil, errors.InvalidArgument(EntityExternalTable, "external table source is empty")
	}

	var option bigquery.ExternalDataConfigOptions
	var sourceType bigquery.DataFormat
	switch bigquery.DataFormat(strings.ToUpper(es.SourceType)) {
	case bigquery.GoogleSheets:
		option = bqGoogleSheetsOptionsTo(es.Config)
		sourceType = bigquery.GoogleSheets
	default:
		return nil, errors.InvalidArgument(EntityExternalTable, "source format not yet implemented "+es.SourceType)
	}

	externalConfig := &bigquery.ExternalDataConfig{
		SourceFormat: sourceType,
		SourceURIs:   es.SourceURIs,
		Options:      option,
	}
	// Without a declared schema, let BigQuery infer one from the source.
	if len(schema) == 0 {
		externalConfig.AutoDetect = true
	}
	return externalConfig, nil
}
// bqGoogleSheetsOptionsTo translates the source config map into Google Sheets
// options. The skip_leading_rows value is applied only when it is positive;
// the range value is copied as-is.
func bqGoogleSheetsOptionsTo(m map[string]any) *bigquery.GoogleSheetsOptions {
	opts := new(bigquery.GoogleSheetsOptions)

	// Numbers arrive as float64 (grpc structpb.Struct casts numbers to
	// float64), so read the value as a float and convert.
	if n := ConfigAs[float64](m, skipLeadingRowsKey); n > 0 {
		opts.SkipLeadingRows = int64(n)
	}

	opts.Range = ConfigAs[string](m, rangeKey)
	return opts
}
// toBQSchema converts the project schema into a BigQuery schema, recursing
// into nested field schemas. Field types are upper-cased, and the Required and
// Repeated flags are derived from a case-insensitive comparison of the field
// mode against ModeRequired and ModeRepeated. An empty input yields a nil
// schema.
func toBQSchema(schema Schema) bigquery.Schema {
	var fields bigquery.Schema
	for _, col := range schema {
		bqField := new(bigquery.FieldSchema)
		bqField.Name = col.Name
		bqField.Description = col.Description
		bqField.Type = bigquery.FieldType(strings.ToUpper(col.Type))
		bqField.Required = strings.EqualFold(ModeRequired, col.Mode)
		bqField.Repeated = strings.EqualFold(ModeRepeated, col.Mode)

		// Nested columns are converted recursively.
		if len(col.Schema) != 0 {
			bqField.Schema = toBQSchema(col.Schema)
		}

		fields = append(fields, bqField)
	}
	return fields
}