/
multiobjectreader.go
87 lines (80 loc) · 1.66 KB
/
multiobjectreader.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
package main
import (
"compress/bzip2"
"compress/gzip"
"context"
"io"
"strings"
"cloud.google.com/go/storage"
)
// MultiObjectReader is an io.Reader that presents a list of objects from one
// storage bucket as a single stream, read in list order.
type MultiObjectReader struct {
	ctx     context.Context       // passed to NewReader for every object that is opened
	bucket  *storage.BucketHandle // bucket the objects are read from
	objects []string              // object names, in the order they are read
	objIdx  int                   // index into objects of the next object to open
	reader  io.Reader             // reader for the current object; nil before the first object is opened
}
// NewMultiObjectReader returns a reader that streams the named objects of
// bucket back to back, in the order given.
//
// The objects slice is copied, so later modifications by the caller do not
// change what the reader will read. Nothing is opened here; the first object
// is opened lazily by the first call to Read. ctx is stored and used for every
// object that is opened afterwards.
func NewMultiObjectReader(ctx context.Context, bucket *storage.BucketHandle, objects []string) *MultiObjectReader {
	// objects[:] would only reslice and keep sharing the caller's backing
	// array, so take a real copy.
	names := make([]string, len(objects))
	copy(names, objects)

	return &MultiObjectReader{
		ctx:     ctx,
		bucket:  bucket,
		objects: names,
	}
}
// Read implements io.Reader. It fills data from the current object and moves
// on to the next one once the current object is exhausted, so callers see the
// listed objects as one continuous stream.
//
// io.EOF is returned only after the last object has been fully consumed; an
// empty object list yields io.EOF on the first call. Any other error, whether
// from opening an object or from reading it, is returned as is.
//
// Adapted from Go's io.MultiReader implementation
// (https://golang.org/src/io/multi.go).
func (m *MultiObjectReader) Read(data []byte) (n int, err error) {
	for {
		if m.reader == nil {
			// No object is open: either nothing has been read yet or the
			// previous object has just been exhausted.
			if m.objIdx >= len(m.objects) {
				return 0, io.EOF
			}
			if err = m.nextReader(); err != nil {
				return 0, err
			}
		}

		n, err = m.reader.Read(data)
		if err != io.EOF {
			return n, err
		}

		// The current object is exhausted: release it if it can be closed and
		// forget it, so the next iteration (or the next call) opens the
		// following object.
		if c, ok := m.reader.(io.Closer); ok {
			// Every byte has already been delivered, so a failure to close
			// cannot affect the data and is deliberately ignored.
			_ = c.Close()
		}
		m.reader = nil

		if n > 0 {
			// Hand back the tail of this object now; end of stream, if this
			// was the last object, is reported by the next call.
			return n, nil
		}
		// Nothing was read (for example an empty object): loop rather than
		// return (0, nil), which io.Reader discourages.
	}
}
// objectStream couples the (possibly decompressed) byte stream of a single
// object with the closer of the storage reader underneath it, so that closing
// the stream releases the storage reader even when a decompressor sits on top.
type objectStream struct {
	io.Reader
	closer io.Closer
}

// Close closes the underlying storage reader.
func (s *objectStream) Close() error {
	return s.closer.Close()
}

// nextReader opens the object at m.objIdx, passes it through maybeDecompress,
// and installs the result as the current reader.
//
// On success m.objIdx is advanced and the previously installed reader, if it
// implements io.Closer, is closed. On failure the receiver is left unchanged,
// so the same object is attempted again by the next call. io.EOF is returned
// when there is no object left to open.
func (m *MultiObjectReader) nextReader() error {
	if m.objIdx >= len(m.objects) {
		// Covers the empty list as well, which would otherwise panic on the
		// index expression below.
		return io.EOF
	}

	name := m.objects[m.objIdx]
	raw, err := m.bucket.Object(name).NewReader(m.ctx)
	if err != nil {
		return err
	}

	stream, err := maybeDecompress(name, raw)
	if err != nil {
		// Do not leak the storage reader when the decompressor rejects the
		// data; the decompression error is the one worth reporting.
		_ = raw.Close()
		return err
	}

	// Only release the previous object once its replacement is ready, so a
	// failed open never leaves a closed reader installed.
	if prev, ok := m.reader.(io.Closer); ok {
		_ = prev.Close() // best effort: the previous object is no longer read from
	}

	m.objIdx++
	m.reader = &objectStream{Reader: stream, closer: raw}
	return nil
}
// maybeDecompress wraps reader in a decompressor chosen from filename's
// suffix: gzip for ".gz", bzip2 for ".bz2" or ".bzip2". For any other name, or
// for every name when the package-level noDecompress setting is true, reader
// is returned unchanged.
//
// An error is returned only when gzip.NewReader fails; the returned reader is
// then nil.
func maybeDecompress(filename string, reader io.Reader) (io.Reader, error) {
	if *noDecompress {
		return reader, nil
	}

	switch {
	case strings.HasSuffix(filename, ".gz"):
		gz, err := gzip.NewReader(reader)
		if err != nil {
			// Return an untyped nil: passing the nil *gzip.Reader through as
			// an io.Reader would give the caller a non-nil interface value.
			return nil, err
		}
		return gz, nil
	case strings.HasSuffix(filename, ".bz2"), strings.HasSuffix(filename, ".bzip2"):
		return bzip2.NewReader(reader), nil
	default:
		return reader, nil
	}
}