forked from attic-labs/noms
-
Notifications
You must be signed in to change notification settings - Fork 0
/
spec.go
332 lines (280 loc) · 8.46 KB
/
spec.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
// Copyright 2016 Attic Labs, Inc. All rights reserved.
// Licensed under the Apache License, version 2.0:
// http://www.apache.org/licenses/LICENSE-2.0
// Package spec provides builders and parsers for spelling Noms databases,
// datasets and values.
package spec
import (
"errors"
"fmt"
"net/url"
"regexp"
"strings"
"os"
"github.com/attic-labs/noms/go/chunks"
"github.com/attic-labs/noms/go/datas"
"github.com/attic-labs/noms/go/nbs"
"github.com/attic-labs/noms/go/types"
"github.com/aws/aws-sdk-go/aws"
"github.com/aws/aws-sdk-go/aws/session"
"github.com/aws/aws-sdk-go/service/dynamodb"
"github.com/aws/aws-sdk-go/service/s3"
)
const Separator = "::"
var datasetRe = regexp.MustCompile("^" + datas.DatasetRe.String() + "$")
// SpecOptions customize Spec behavior.
type SpecOptions struct {
// Authorization token for requests. For example, if the database is HTTP
// this will used for an `Authorization: Bearer ${authorization}` header.
Authorization string
}
// Spec locates a Noms database, dataset, or value globally.
type Spec struct {
// Protocol is one of "mem", "ldb", "http", or "https".
Protocol string
// DatabaseName is the name of the Spec's database, which is the string after
// "protocol:". http/https specs include their leading "//" characters.
DatabaseName string
// Options are the SpecOptions that the Spec was constructed with.
Options SpecOptions
// Path is nil unless the spec was created with ForPath.
Path AbsolutePath
// db is lazily created, so it needs to be a pointer to a Database.
db *datas.Database
}
func newSpec(dbSpec string, opts SpecOptions) (Spec, error) {
protocol, dbName, err := parseDatabaseSpec(dbSpec)
if err != nil {
return Spec{}, err
}
return Spec{
Protocol: protocol,
DatabaseName: dbName,
Options: opts,
db: new(datas.Database),
}, nil
}
// ForDatabase parses a spec for a Database.
func ForDatabase(spec string) (Spec, error) {
return ForDatabaseOpts(spec, SpecOptions{})
}
// ForDatabaseOpts parses a spec for a Database.
func ForDatabaseOpts(spec string, opts SpecOptions) (Spec, error) {
return newSpec(spec, opts)
}
// ForDataset parses a spec for a Dataset.
func ForDataset(spec string) (Spec, error) {
return ForDatasetOpts(spec, SpecOptions{})
}
// ForDatasetOpts parses a spec for a Dataset.
func ForDatasetOpts(spec string, opts SpecOptions) (Spec, error) {
dbSpec, pathStr, err := splitDatabaseSpec(spec)
sp, err := newSpec(dbSpec, opts)
if err != nil {
return Spec{}, err
}
path, err := NewAbsolutePath(pathStr)
if err != nil {
return Spec{}, err
}
if path.Dataset == "" {
return Spec{}, errors.New("dataset name required for dataset spec")
}
if !path.Path.IsEmpty() {
return Spec{}, errors.New("path is not allowed for dataset spec")
}
sp.Path = path
return sp, nil
}
// ForPath parses a spec for a path to a Value.
func ForPath(spec string) (Spec, error) {
return ForPathOpts(spec, SpecOptions{})
}
// ForPathOpts parses a spec for a path to a Value.
func ForPathOpts(spec string, opts SpecOptions) (Spec, error) {
dbSpec, pathStr, err := splitDatabaseSpec(spec)
if err != nil {
return Spec{}, err
}
var path AbsolutePath
if pathStr != "" {
path, err = NewAbsolutePath(pathStr)
if err != nil {
return Spec{}, err
}
}
sp, err := newSpec(dbSpec, opts)
if err != nil {
return Spec{}, err
}
sp.Path = path
return sp, nil
}
func (sp Spec) String() string {
s := sp.Protocol
if s != "mem" {
s += ":" + sp.DatabaseName
}
p := sp.Path.String()
if p != "" {
s += Separator + p
}
return s
}
// GetDatabase returns the Database instance that this Spec's DatabaseName
// describes. The same Database instance is returned every time, unless Close
// is called. If the Spec is closed, it is re-opened with a new Database.
func (sp Spec) GetDatabase() datas.Database {
if *sp.db == nil {
*sp.db = sp.createDatabase()
}
return *sp.db
}
// NewChunkStore returns a new ChunkStore instance that this Spec's
// DatabaseName describes. It's unusual to call this method, GetDatabase is
// more useful. Unlike GetDatabase, a new ChunkStore instance is returned every
// time. If there is no ChunkStore, for example remote databases, returns nil.
func (sp Spec) NewChunkStore() chunks.ChunkStore {
switch sp.Protocol {
case "http", "https":
return nil
case "aws":
return parseAWSSpec(sp.Href())
case "nbs":
return nbs.NewLocalStore(sp.DatabaseName, 1<<28)
case "mem":
return chunks.NewMemoryStore()
}
panic("unreachable")
}
func parseAWSSpec(awsURL string) chunks.ChunkStore {
u, _ := url.Parse(awsURL)
parts := strings.SplitN(u.Host, ":", 2) // [table] [, bucket]?
sess := session.Must(session.NewSession(aws.NewConfig().WithRegion("us-west-2")))
ddb := dynamodb.New(sess)
if len(parts) == 1 {
return chunks.NewDynamoStore(parts[0], u.Path, ddb, false)
}
return nbs.NewAWSStore(parts[0], u.Path, parts[1], s3.New(sess), ddb, 1<<28)
}
// GetDataset returns the current Dataset instance for this Spec's Database.
// GetDataset is live, so if Commit is called on this Spec's Database later, a
// new up-to-date Dataset will returned on the next call to GetDataset. If
// this is not a Dataset spec, returns nil.
func (sp Spec) GetDataset() (ds datas.Dataset) {
if sp.Path.Dataset != "" {
ds = sp.GetDatabase().GetDataset(sp.Path.Dataset)
}
return
}
// GetValue returns the Value at this Spec's Path within its Database, or nil
// if this isn't a Path Spec or if that path isn't found.
func (sp Spec) GetValue() (val types.Value) {
if !sp.Path.IsEmpty() {
val = sp.Path.Resolve(sp.GetDatabase())
}
return
}
// Href treats the Protocol and DatabaseName as a URL, and returns its href.
// For example, the spec http://example.com/path::ds returns
// "http://example.com/path". If the Protocol is not "http" or "http", returns
// an empty string.
func (sp Spec) Href() string {
switch proto := sp.Protocol; proto {
case "http", "https", "aws":
return proto + ":" + sp.DatabaseName
default:
return ""
}
}
// Pin returns a Spec in which the dataset component, if any, has been replaced
// with the hash of the HEAD of that dataset. This "pins" the path to the state
// of the database at the current moment in time. Returns itself if the
// PathSpec is already "pinned".
func (sp Spec) Pin() (Spec, bool) {
var ds datas.Dataset
if !sp.Path.IsEmpty() {
if !sp.Path.Hash.IsEmpty() {
// Spec is already pinned.
return sp, true
}
ds = sp.GetDatabase().GetDataset(sp.Path.Dataset)
} else {
ds = sp.GetDataset()
}
commit, ok := ds.MaybeHead()
if !ok {
return Spec{}, false
}
r := sp
r.Path.Hash = commit.Hash()
r.Path.Dataset = ""
return r, true
}
func (sp Spec) Close() error {
db := *sp.db
if db == nil {
return nil
}
*sp.db = nil
return db.Close()
}
func (sp Spec) createDatabase() datas.Database {
switch sp.Protocol {
case "http", "https":
return datas.NewRemoteDatabase(sp.Href(), sp.Options.Authorization)
case "aws":
return datas.NewDatabase(parseAWSSpec(sp.Href()))
case "nbs":
os.Mkdir(sp.DatabaseName, 0777)
return datas.NewDatabase(nbs.NewLocalStore(sp.DatabaseName, 1<<28))
case "mem":
return datas.NewDatabase(chunks.NewMemoryStore())
}
panic("unreachable")
}
func parseDatabaseSpec(spec string) (protocol, name string, err error) {
if len(spec) == 0 {
err = fmt.Errorf("Empty spec")
return
}
parts := strings.SplitN(spec, ":", 2) // [protocol] [, path]?
// If there was no ":" then this is either a mem spec, or a filesystem path.
// This is ambiguous if the file system path is "mem" but that just means the
// path needs to be explicitly "nbs:mem".
if len(parts) == 1 {
if spec == "mem" {
protocol = "mem"
} else {
protocol, name = "nbs", spec
}
return
}
switch parts[0] {
case "nbs":
protocol, name = parts[0], parts[1]
case "http", "https", "aws":
u, perr := url.Parse(spec)
if perr != nil {
err = perr
} else if u.Host == "" {
err = fmt.Errorf("%s has empty host", spec)
} else if parts[0] == "aws" && u.Path == "" {
err = fmt.Errorf("%s does not specify a database ID", spec)
} else {
protocol, name = parts[0], parts[1]
}
case "mem":
err = fmt.Errorf(`In-memory database must be specified as "mem", not "mem:"`)
default:
err = fmt.Errorf("Invalid database protocol %s in %s", protocol, spec)
}
return
}
func splitDatabaseSpec(spec string) (string, string, error) {
lastIdx := strings.LastIndex(spec, Separator)
if lastIdx == -1 {
return "", "", fmt.Errorf("Missing %s after database in %s", Separator, spec)
}
return spec[:lastIdx], spec[lastIdx+len(Separator):], nil
}