forked from xitongsys/parquet-go-source
/
memfs_write.go
108 lines (98 loc) · 2.69 KB
/
memfs_write.go
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
package main
import (
"io"
"io/ioutil"
"log"
"os"
"time"
"github.com/xitongsys/parquet-go-source/mem"
"github.com/xitongsys/parquet-go-source/local"
"github.com/xitongsys/parquet-go/reader"
"github.com/xitongsys/parquet-go/writer"
"github.com/xitongsys/parquet-go/parquet"
)
// Student is the row type written to and read back from the example Parquet
// file. The `parquet` struct tags give each column's name and Parquet type.
type Student struct {
	// Name is stored as a UTF8 column using PLAIN_DICTIONARY encoding.
	Name string `parquet:"name=name, type=UTF8, encoding=PLAIN_DICTIONARY"`
	// Age is stored as an INT32 column.
	Age int32 `parquet:"name=age, type=INT32"`
	// Id is stored as an INT64 column.
	Id int64 `parquet:"name=id, type=INT64"`
	// Weight is stored as a FLOAT column.
	Weight float32 `parquet:"name=weight, type=FLOAT"`
	// Sex is stored as a BOOLEAN column.
	Sex bool `parquet:"name=sex, type=BOOLEAN"`
	// Day is stored as a DATE column; main fills it with whole days since
	// the Unix epoch.
	Day int32 `parquet:"name=day, type=DATE"`
}
// main demonstrates a Parquet round trip through an in-memory ParquetFile:
//
//  1. Student rows are written to a mem-backed writer with SNAPPY compression.
//  2. When that writer is closed, the on-close callback copies the finished
//     bytes to a file of the same name on local disk.
//  3. The on-disk file is read back row by row and each row is logged.
//  4. The entry is removed from the in-memory file system.
//
// Setup failures are logged and end the program early; a failure to remove
// the in-memory entry exits with status 1.
func main() {
	const fileName = "flat.parquet.snappy"

	// Create an in-memory ParquetFile with an on-close callback.
	// NOTE: the callback may be nil, in which case no extra action runs when
	// the writer is closed.
	fw, err := mem.NewMemFileWriter(fileName, func(name string, r io.Reader) error {
		dat, err := ioutil.ReadAll(r)
		if err != nil {
			log.Printf("error reading data: %v", err)
			// Report the failure to the caller instead of killing the process
			// from inside a callback.
			return err
		}
		// Persist the in-memory contents to disk under the same name.
		if err := ioutil.WriteFile(name, dat, 0644); err != nil {
			log.Printf("error writing result file: %v", err)
			// Do not report success when nothing was written.
			return err
		}
		return nil
	})
	if err != nil {
		log.Println("Can't create in-memory file", err)
		return
	}

	// Write.
	pw, err := writer.NewParquetWriter(fw, new(Student), 4)
	if err != nil {
		log.Println("Can't create parquet writer", err)
		return
	}
	pw.RowGroupSize = 128 * 1024 * 1024 // 128M
	pw.CompressionType = parquet.CompressionCodec_SNAPPY

	num := 10
	// Days since the Unix epoch; computed once because it does not depend on
	// the loop variable.
	day := int32(time.Now().Unix() / 3600 / 24)
	for i := 0; i < num; i++ {
		stu := Student{
			Name:   "StudentName",
			Age:    int32(20 + i%5),
			Id:     int64(i),
			Weight: 50.0 + float32(i)*0.1,
			Sex:    i%2 == 0,
			Day:    day,
		}
		// Best effort: a failed row is reported and the remaining rows are
		// still attempted.
		if err = pw.Write(stu); err != nil {
			log.Println("Write error", err)
		}
	}
	if err = pw.WriteStop(); err != nil {
		log.Println("WriteStop error", err)
		return
	}
	log.Println("Write Finished")

	// Closing the writer is what runs the on-close callback above, so a
	// failure here means the on-disk copy may be missing or incomplete.
	// NOTE(review): presumably Close propagates the callback's error —
	// confirm against the mem package.
	if err = fw.Close(); err != nil {
		log.Println("Close error", err)
		return
	}

	// Read.
	fr, err := local.NewLocalFileReader(fileName)
	if err != nil {
		log.Println("Can't open file", err)
		return
	}
	pr, err := reader.NewParquetReader(fr, new(Student), 4)
	if err != nil {
		log.Println("Can't create parquet reader", err)
		// Release the file handle opened just above before bailing out.
		if cerr := fr.Close(); cerr != nil {
			log.Println("Close error", cerr)
		}
		return
	}
	num = int(pr.GetNumRows())
	for i := 0; i < num; i++ {
		// Read one row per call.
		stus := make([]Student, 1)
		if err = pr.Read(&stus); err != nil {
			log.Println("Read error", err)
			// Stop instead of logging a zero-valued row as if it were data.
			break
		}
		log.Println(stus)
	}
	pr.ReadStop()
	if err = fr.Close(); err != nil {
		log.Println("Close error", err)
	}

	// NOTE: the underlying in-memory file system is reachable through
	// mem.GetMemFileFs().
	// EXAMPLE: this deletes the file we created from the in-memory file system.
	if err := mem.GetMemFileFs().Remove(fileName); err != nil {
		log.Printf("error removing file from memfs: %v", err)
		os.Exit(1)
	}
}