-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathsql_queries.py
158 lines (137 loc) · 3.98 KB
/
sql_queries.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
# DROP TABLES
songplay_table_drop = "DROP TABLE IF EXISTS songplays;"
user_table_drop = "DROP TABLE IF EXISTS users;"
song_table_drop = "DROP TABLE IF EXISTS songs;"
artist_table_drop = "DROP TABLE IF EXISTS artists;"
time_table_drop = "DROP TABLE IF EXISTS time;"
# CREATE TABLES
user_table_create = ("""
CREATE TABLE IF NOT EXISTS users
(user_id INT PRIMARY KEY UNIQUE NOT NULL,
first_name VARCHAR NOT NULL,
last_name VARCHAR NOT NULL,
gender CHAR,
level VARCHAR NOT NULL);
""")
song_table_create = ("""
CREATE TABLE IF NOT EXISTS songs
(song_id VARCHAR PRIMARY KEY UNIQUE NOT NULL,
title VARCHAR NOT NULL, artist_id VARCHAR NOT NULL,
artist_name VARCHAR NOT NULL,
year INT NOT NULL,
duration FLOAT8 NOT NULL);
""")
artist_table_create = ("""
CREATE TABLE IF NOT EXISTS artists
(artist_id VARCHAR PRIMARY KEY UNIQUE NOT NULL,
name VARCHAR NOT NULL,
location VARCHAR,
latitude FLOAT8,
longitude FLOAT8);
""")
time_table_create = ("""
CREATE TABLE IF NOT EXISTS time
(start_time BIGINT PRIMARY KEY NOT NULL,
hour VARCHAR NOT NULL,
day VARCHAR NOT NULL,
week VARCHAR NOT NULL,
month VARCHAR NOT NULL,
year VARCHAR NOT NULL,
weekday VARCHAR NOT NULL);
""")
songplay_table_create = ("""
CREATE TABLE IF NOT EXISTS songplays
(songplay_id SERIAL PRIMARY KEY UNIQUE NOT NULL,
start_time BIGINT NOT NULL,
session_id VARCHAR NOT NULL,
user_id INT NOT NULL,
song_id VARCHAR,
artist_id VARCHAR,
level VARCHAR NOT NULL,
location VARCHAR,
user_agent VARCHAR,
FOREIGN KEY (start_time) REFERENCES time (start_time),
FOREIGN KEY (song_id) REFERENCES songs (song_id),
FOREIGN KEY (user_id) REFERENCES users (user_id),
FOREIGN KEY (artist_id) REFERENCES artists (artist_id));
""")
# INSERT RECORDS
songplay_table_insert = ("""
INSERT INTO songplays
(start_time,
session_id,
user_id,
song_id,
artist_id,
level,
location,
user_agent)
VALUES
(%s, %s, %s, %s, %s, %s, %s, %s);
""")
# user table insertion
user_table_insert = ("""
INSERT INTO users
(user_id,
first_name,
last_name,
gender,
level)
VALUES
(%s, %s, %s, %s, %s)
ON CONFLICT (user_id)
DO UPDATE SET level = excluded.level;
""")
# song table insertion
song_table_insert = ("""
INSERT INTO songs
(song_id,
title,
artist_id,
artist_name,
year,
duration)
VALUES
(%s, %s, %s, %s, %s, %s)
ON CONFLICT (song_id)
DO UPDATE SET duration = excluded.duration;
""")
# song table insertion
artist_table_insert = ("""
INSERT INTO artists
(artist_id,
name,
location,
latitude,
longitude)
VALUES
(%s, %s, %s, %s, %s)
ON CONFLICT (artist_id)
DO UPDATE SEt name = excluded.name;
""")
# time table insert
time_table_insert = ("""
INSERT INTO time
(start_time,
hour,
day,
week,
month,
year,
weekday)
VALUES
(%s, %s, %s, %s, %s, %s, %s);
""")
# FIND SONGS
song_select = ("""
SELECT song_id, artist_id
FROM songs
WHERE title LIKE %s
AND artist_name LIKE %s
AND duration = %s
GROUP BY song_id,
artist_id;
""")
# QUERY LISTS
create_table_queries = [user_table_create, song_table_create, artist_table_create, time_table_create, songplay_table_create]
drop_table_queries = [songplay_table_drop, user_table_drop, song_table_drop, artist_table_drop, time_table_drop]