-
Notifications
You must be signed in to change notification settings - Fork 542
/
prepare_data.sh
executable file
·52 lines (45 loc) · 1.09 KB
/
prepare_data.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
#!/usr/bin/env bash
#
# prepare_data.sh - rebuild the deepdive_ocr PostgreSQL database from raw CSVs.
#
# Steps:
#   1. Drop the database if it exists, then create it again.
#   2. Reset the public schema and create the tables features,
#      feature_names, label1 and label2.
#   3. Bulk-load data/raw/feature_table.csv, label1_table.csv and
#      label2_table.csv (paths relative to this script's directory).
#
# feature_names is only created here; this script does not load it.
# The id column of label1/label2 is not part of the COPY column list, so it
# is left NULL by the load.
#
# Connection parameters are whatever dropdb/createdb/psql use by default.
#
# WARNING: destroys any existing database named deepdive_ocr.

# Abort on the first failing command, on unset variables, and on failures
# inside pipelines, so a broken step never leaves a half-built database
# that looks like a successful run.
set -euo pipefail

# Configuration
readonly DB_NAME=deepdive_ocr

# Work from the directory containing this script so that the data paths
# resolve no matter where the script is invoked from.
cd -- "$(dirname -- "$0")"
BASE_DIR=$(pwd)
readonly BASE_DIR
readonly RAW_DIR="${BASE_DIR}/data/raw"

# Print a message to stderr and exit with a failure status.
die() {
  printf '%s\n' "$*" >&2
  exit 1
}

# Run one SQL command string against DB_NAME.
# Arguments: $1 - SQL text
# Stdin is passed through to psql, which COPY ... FROM STDIN relies on.
run_sql() {
  psql -v ON_ERROR_STOP=1 -c "$1" "$DB_NAME"
}

# Load a comma-delimited CSV file into a table via COPY ... FROM STDIN.
# Arguments: $1 - COPY target, e.g. 'label1(wid, val)'
#            $2 - path of the CSV file to load
load_csv() {
  local target=$1
  local csv_file=$2
  run_sql "
COPY ${target}
FROM STDIN DELIMITER ',' CSV;
" <"$csv_file"
}

main() {
  local -r features_csv="${RAW_DIR}/feature_table.csv"
  local -r label1_csv="${RAW_DIR}/label1_table.csv"
  local -r label2_csv="${RAW_DIR}/label2_table.csv"
  local csv_file

  # Check every input before touching the database: dropping it and then
  # discovering a missing file would destroy data for nothing.
  for csv_file in "$features_csv" "$label1_csv" "$label2_csv"; do
    [[ -r "$csv_file" ]] || die "missing or unreadable input: ${csv_file}"
  done

  # --if-exists keeps a first run (no database yet) from failing.
  dropdb --if-exists "$DB_NAME"
  createdb "$DB_NAME"

  run_sql "
DROP SCHEMA IF EXISTS public CASCADE;
CREATE SCHEMA public;
"

  run_sql "
CREATE TABLE features(
id BIGSERIAL PRIMARY KEY,
word_id INT,
feature_id INT,
feature_val BOOLEAN);
"

  run_sql "
CREATE TABLE feature_names(
fid INT PRIMARY KEY,
fname VARCHAR(20));
"

  run_sql "
CREATE TABLE label1(
wid INT, val BOOLEAN,
id BIGINT);
"

  run_sql "
CREATE TABLE label2(
wid INT, val BOOLEAN,
id BIGINT);
"

  load_csv 'features(word_id, feature_id, feature_val)' "$features_csv"
  load_csv 'label1(wid, val)' "$label1_csv"
  load_csv 'label2(wid, val)' "$label2_csv"
}

main "$@"