/
ddbloader.go
185 lines (176 loc) · 6.14 KB
/
ddbloader.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
package main
import (
"errors"
"fmt"
"io"
"log"
"net/http"
"os"
"reflect"
"strconv"
"strings"
"github.com/aws/aws-sdk-go/aws"
"github.com/aws/aws-sdk-go/aws/credentials"
"github.com/aws/aws-sdk-go/aws/session"
"github.com/codingconcepts/env"
"github.com/go-playground/validator/v10"
"github.com/hashicorp/logutils"
"github.com/ourrootsorg/cms-server/model"
"github.com/ourrootsorg/cms-server/persist/dynamo"
)
// main loads reference data files into a DynamoDB table.
//
// It reads its configuration from the environment (see ParseEnv), raises the
// table's provisioned throughput to config.LoadThroughput, loads every file
// listed in FILE_URLS or FILE_PATHS, and finally sets the throughput to
// config.NormalThroughput. Any failure is logged at FATAL level and terminates
// the process.
func main() {
	config, err := ParseEnv()
	if err != nil {
		log.Fatalf("[FATAL] %v", err)
	}

	// Route the standard logger through a level filter so that messages below
	// the configured minimum level are dropped.
	filter := &logutils.LevelFilter{
		Levels:   []logutils.LogLevel{"DEBUG", "INFO", "ERROR", "FATAL"},
		MinLevel: logutils.LogLevel(config.MinLogLevel),
		Writer:   os.Stderr,
	}
	log.SetOutput(filter)

	cfgs := make([]*aws.Config, 0)
	if config.LocalTest {
		// Use DynamoDB local
		cfgs = append(cfgs, &aws.Config{
			Region:      aws.String(config.Region),
			Endpoint:    aws.String("http://localhost:18000"),
			DisableSSL:  aws.Bool(true),
			Credentials: credentials.NewStaticCredentials("ACCESS_KEY", "SECRET", ""),
		})
	}
	sess, err := session.NewSession(cfgs...)
	if err != nil {
		log.Fatalf("[FATAL] Error creating AWS session: %v", err)
	}
	p, err := dynamo.NewPersister(sess, config.DynamoDBTableName)
	if err != nil {
		log.Fatalf("[FATAL] Error creating DynamoDB persister: %v", err)
	}

	err = p.SetThroughput(config.LoadThroughput, config.LoadThroughput)
	if err != nil {
		log.Fatalf("[FATAL] Error setting table throughput for data load: %v", err)
	}

	// FILE_URLS takes precedence; ParseEnv rejects configurations that set both.
	fileNames := config.FilePaths
	if config.FileURLs != "" {
		fileNames = config.FileURLs
	}

	// loadFile opens one file, dispatches it to the loader selected by its
	// name suffix and closes it again before returning. Doing the work in a
	// closure means the deferred Close runs once per file instead of piling
	// up until main returns.
	loadFile := func(fileName string) error {
		r := openFile(config, fileName)
		defer r.Close()

		switch {
		case strings.HasSuffix(fileName, "places.tsv"):
			if loadErr := p.LoadPlaceData(r); loadErr != nil {
				return fmt.Errorf("Unable to load place data from %s: %v", fileName, loadErr)
			}
			log.Printf("[INFO] Loaded place data from %s", fileName)
		case strings.HasSuffix(fileName, "place_settings.tsv"):
			log.Printf("[DEBUG] Loading place settings data from %s", fileName)
			if loadErr := p.LoadPlaceSettingsData(r); loadErr != nil {
				return fmt.Errorf("Unable to load place settings data from %s: %v", fileName, loadErr)
			}
			log.Printf("[INFO] Loaded place settings data from %s", fileName)
		case strings.HasSuffix(fileName, "place_words.tsv"):
			if loadErr := p.LoadPlaceWordData(r); loadErr != nil {
				return fmt.Errorf("Unable to load place word data from %s: %v", fileName, loadErr)
			}
			log.Printf("[INFO] Loaded place words data from %s", fileName)
		case strings.HasSuffix(fileName, "givenname_variants.tsv"):
			if loadErr := p.LoadNameVariantsData(r, model.GivenType); loadErr != nil {
				return fmt.Errorf("Unable to load name variants data from %s: %v", fileName, loadErr)
			}
			log.Printf("[INFO] Loaded name variants data from %s", fileName)
		case strings.HasSuffix(fileName, "surname_variants.tsv"):
			if loadErr := p.LoadNameVariantsData(r, model.SurnameType); loadErr != nil {
				return fmt.Errorf("Unable to load name variants data from %s: %v", fileName, loadErr)
			}
			log.Printf("[INFO] Loaded name variants data from %s", fileName)
		default:
			return fmt.Errorf("Don't know how to load '%s'", fileName)
		}
		return nil
	}

	for _, fileName := range strings.Split(fileNames, ",") {
		// Tolerate "a.tsv, b.tsv" and trailing commas in the list.
		fileName = strings.TrimSpace(fileName)
		if fileName == "" {
			continue
		}
		if loadErr := loadFile(fileName); loadErr != nil {
			log.Fatalf("[FATAL] %v", loadErr)
		}
	}

	err = p.SetThroughput(config.NormalThroughput, config.NormalThroughput)
	if err != nil {
		log.Fatalf("[FATAL] Error setting final table throughput. **WARNING** You should review the provisioned throughput ASAP, because the current throughput may be expensive!: %v", err)
	}
}
// openFile opens fileName for reading and returns the resulting stream; the
// caller is responsible for closing it.
//
// When config.FileURLs is set, fileName is treated as a URL and fetched with
// an HTTP GET; otherwise it is treated as a local file path. Any failure,
// including a non-2xx HTTP response, is logged at FATAL level and terminates
// the process, so the returned reader is always usable.
func openFile(config *Env, fileName string) io.ReadCloser {
	if config.FileURLs == "" {
		f, err := os.Open(fileName)
		if err != nil {
			log.Fatalf("[FATAL] Unable to open file path %s: %v", fileName, err)
		}
		return f
	}

	resp, err := http.Get(fileName)
	if err != nil {
		log.Fatalf("[FATAL] Unable to open file URL %s: %v", fileName, err)
	}
	// http.Get reports only transport-level failures through err; a 404 or 500
	// still yields a response whose body would otherwise be parsed as data.
	if resp.StatusCode < http.StatusOK || resp.StatusCode >= http.StatusMultipleChoices {
		resp.Body.Close()
		log.Fatalf("[FATAL] Unable to open file URL %s: unexpected HTTP status %s", fileName, resp.Status)
	}
	return resp.Body
}
// Env holds values parsed from environment variables.
//
// The `env` tag names the environment variable a field is read from and the
// `validate` tag carries the validation rules that ParseEnv applies.
type Env struct {
// MinLogLevel is the minimum level passed to the log filter in main;
// ParseEnv defaults it to "DEBUG" when unset.
MinLogLevel string `env:"MIN_LOG_LEVEL" validate:"omitempty,eq=DEBUG|eq=INFO|eq=ERROR"`
// DynamoDBTableName is the table name handed to dynamo.NewPersister.
DynamoDBTableName string `env:"DYNAMODB_TABLE_NAME" validate:"required"`
// LoadThroughput is the throughput value main sets on the table before loading.
LoadThroughput int `env:"LOAD_THROUGHPUT" validate:"numeric,min=2"`
// NormalThroughput is the throughput value main sets on the table after loading.
NormalThroughput int `env:"NORMAL_THROUGHPUT" validate:"numeric,min=2"`
// Region is the AWS region; main uses it when configuring the local-test session.
Region string `env:"AWS_REGION" validate:"required"`
// FileURLs is a comma-separated list of URLs to load. ParseEnv rejects
// configurations that set both FileURLs and FilePaths.
FileURLs string `env:"FILE_URLS" validate:"required_without=FilePaths,omitempty"`
// FilePaths is a comma-separated list of local file paths to load.
FilePaths string `env:"FILE_PATHS" validate:"required_without=FileURLs,omitempty"`
// LocalTestString is the raw LOCAL_TEST value ("true" or "false").
LocalTestString string `env:"LOCAL_TEST" validate:"omitempty,eq=true|eq=false"`
// LocalTest is the parsed form of LocalTestString. It has no env tag;
// ParseEnv sets it. When true, main points the session at a local DynamoDB.
LocalTest bool
}
// ParseEnv parses and validates environment variables and stores them in the
// Env structure.
//
// On success it returns the populated configuration with MinLogLevel defaulted
// to "DEBUG" when unset and LocalTest derived from LOCAL_TEST. It returns an
// error when the environment cannot be read, when any variable fails
// validation (the error lists every offending variable, one per line), or when
// both FILE_URLS and FILE_PATHS are set.
func ParseEnv() (*Env, error) {
	var config Env
	if err := env.Set(&config); err != nil {
		return nil, err
	}

	validate := validator.New()
	// Report fields by their environment variable name instead of the Go
	// field name, so error messages match what the user actually set.
	validate.RegisterTagNameFunc(func(fld reflect.StructField) string {
		return fld.Tag.Get("env")
	})

	if err := validate.Struct(config); err != nil {
		fieldErrs, ok := err.(validator.ValidationErrors)
		if !ok {
			// Not a per-field validation failure; pass it through untouched
			// rather than panicking on the type assertion.
			return nil, err
		}

		var msg strings.Builder
		msg.WriteString("Error parsing environment variables:\n")
		// When neither file variable is set both fields fail validation;
		// report that condition only once.
		filesReported := false
		for _, fe := range fieldErrs {
			switch fe.Field() {
			case "MIN_LOG_LEVEL":
				fmt.Fprintf(&msg, " Invalid MIN_LOG_LEVEL: '%v', valid values are 'DEBUG', 'INFO' or 'ERROR'\n", fe.Value())
			case "LOCAL_TEST":
				fmt.Fprintf(&msg, " Invalid LOCAL_TEST: '%v', valid values are 'true' or 'false'\n", fe.Value())
			case "AWS_REGION":
				msg.WriteString(" AWS_REGION is required\n")
			case "DYNAMODB_TABLE_NAME":
				msg.WriteString(" DYNAMODB_TABLE_NAME is required\n")
			case "FILE_URLS", "FILE_PATHS":
				if !filesReported {
					msg.WriteString(" One of FILE_URLS or FILE_PATHS is required\n")
					filesReported = true
				}
			case "LOAD_THROUGHPUT", "NORMAL_THROUGHPUT":
				fmt.Fprintf(&msg, " Invalid %s: %v, must be a numeric value >= 2\n", fe.Field(), fe.Value())
			default:
				fmt.Fprintf(&msg, " Other error, fe: %#v\n", fe)
			}
		}
		return nil, errors.New(msg.String())
	}

	if config.MinLogLevel == "" {
		config.MinLogLevel = "DEBUG"
	}
	if config.FileURLs != "" && config.FilePaths != "" {
		return nil, errors.New("Must set only one of FILE_URLS or FILE_PATHS")
	}
	if config.LocalTestString != "" {
		localTest, err := strconv.ParseBool(config.LocalTestString)
		if err != nil {
			// should never happen: validation only admits "true" or "false"
			return nil, fmt.Errorf("Couldn't parse LOCAL_TEST value '%s': %v", config.LocalTestString, err)
		}
		config.LocalTest = localTest
	}
	return &config, nil
}