"""SQL statements for the songplays, users, songs, artists and time tables.

Defines the DROP, CREATE and INSERT query strings, the song/artist lookup
query, and the create_table_queries / drop_table_queries lists that group them.
"""
# DROP TABLE STATEMENTS
# Every drop statement shares one shape; IF EXISTS makes each a no-op when the
# table is not there.
_DROP_IF_EXISTS = "DROP TABLE IF EXISTS {}"

songplay_table_drop = _DROP_IF_EXISTS.format("songplays")
user_table_drop = _DROP_IF_EXISTS.format("users")
song_table_drop = _DROP_IF_EXISTS.format("songs")
artist_table_drop = _DROP_IF_EXISTS.format("artists")
time_table_drop = _DROP_IF_EXISTS.format("time")
# CREATE TABLE STATEMENTS
# songplays: auto-incrementing songplay_id key plus foreign keys into the
# time, users, songs and artists tables, so those four must exist first.
songplay_table_create = (
    "CREATE TABLE IF NOT EXISTS\n"
    "songplays(songplay_id serial PRIMARY KEY,\n"
    "start_time bigint REFERENCES time(start_time),\n"
    "user_id integer NOT NULL REFERENCES users(user_id),\n"
    "level varchar,\n"
    "song_id char(19) NOT NULL REFERENCES songs(song_id),\n"
    "artist_id char(19) NOT NULL REFERENCES artists(artist_id),\n"
    "session_id integer NOT NULL,\n"
    "location varchar,\n"
    "user_agent text);\n"
)
# users: keyed by user_id; the remaining columns are nullable attributes.
user_table_create = (
    "CREATE TABLE IF NOT EXISTS users(user_id integer PRIMARY KEY,\n"
    "first_name varchar,\n"
    "last_name varchar,\n"
    "gender char(1),\n"
    "level varchar);\n"
)
# songs: keyed by song_id; artist_id is a foreign key, so the artists table
# has to be created before this one.
song_table_create = (
    "CREATE TABLE IF NOT EXISTS songs(song_id char(19) PRIMARY KEY,\n"
    "title text,\n"
    "artist_id char(19) REFERENCES artists(artist_id),\n"
    "year integer,\n"
    "duration float);\n"
)
# artists: keyed by artist_id.
# NOTE(review): latitude and longitude are declared varchar, not a numeric
# type — confirm this is intentional before relying on numeric comparisons.
artist_table_create = "\n".join([
    "CREATE TABLE IF NOT EXISTS artists(artist_id char(19) PRIMARY KEY,",
    "name varchar,",
    "location varchar,",
    "latitude varchar,",
    "longitude varchar);",
    "",  # preserves the statement's trailing newline
])
# time: keyed by the bigint start_time, with integer columns for its
# hour/day/week/month/year/weekday parts.
time_table_create = "\n".join([
    "CREATE TABLE IF NOT EXISTS time(start_time bigint PRIMARY KEY,",
    "hour integer,",
    "day integer,",
    "week integer,",
    "month integer,",
    "year integer,",
    "weekday integer);",
    "",  # preserves the statement's trailing newline
])
# INSERT STATEMENTS
# Eight placeholders, one per listed column. songplay_id is left out of the
# column list, so the serial default supplies it.
songplay_table_insert = (
    "INSERT INTO songplays(start_time, user_id, level, song_id, artist_id, "
    "session_id, location, user_agent)\n"
    "VALUES(%s,%s,%s,%s,%s,%s,%s,%s)\n"
    "ON CONFLICT\n"
    "DO NOTHING;\n"
)
# Upsert keyed on users.user_id (the table's primary key).
# A bare "ON CONFLICT DO NOTHING" would keep whichever level was inserted first
# for a user and silently discard any later row carrying a different level.
# Instead, on a duplicate user_id the stored level is overwritten with the
# incoming one (EXCLUDED refers to the row proposed for insertion); the other
# columns of the existing row are left untouched.
# Takes five parameters: user_id, first_name, last_name, gender, level.
user_table_insert = ("""INSERT INTO users(user_id, first_name, last_name, gender, level)
VALUES(%s,%s,%s,%s,%s)
ON CONFLICT (user_id)
DO UPDATE SET level = EXCLUDED.level;
""")
# Five placeholders, one per listed column; a row that collides with an
# existing key is skipped rather than raising.
song_table_insert = (
    "INSERT INTO songs(song_id, title, artist_id, year, duration)\n"
    "VALUES(%s,%s,%s,%s,%s)\n"
    "ON CONFLICT\n"
    "DO NOTHING;\n"
)
# Five placeholders, one per listed column; a row that collides with an
# existing key is skipped rather than raising.
artist_table_insert = (
    "INSERT INTO artists(artist_id, name, location, latitude, longitude)\n"
    "VALUES(%s,%s,%s,%s,%s)\n"
    "ON CONFLICT\n"
    "DO NOTHING;\n"
)
# Seven placeholders, one per listed column; a start_time that is already
# present is skipped rather than raising.
time_table_insert = (
    "INSERT INTO time(start_time, hour, day, week, month, year, weekday)\n"
    "VALUES(%s,%s,%s,%s,%s,%s,%s)\n"
    "ON CONFLICT\n"
    "DO NOTHING;\n"
)
# FIND SONG_ID AND ARTIST_ID FOR SONGPLAYS TABLE
# Looks up the (song_id, artist_id) pair for a play event.
# Parameters, in order: song title, artist name, song duration.
# NOTE(review): duration is a float column compared with "="; the lookup only
# matches when the supplied value is exactly the stored one.
song_select = (
    "SELECT DISTINCT s.song_id, a.artist_id\n"
    "FROM songs s\n"
    "INNER JOIN artists a\n"
    "ON (s.artist_id = a.artist_id)\n"
    "WHERE s.title = %s\n"
    "AND a.name = %s\n"
    "AND s.duration = %s;\n"
)
# QUERY LISTS FOR EXECUTION
# Creation order follows the REFERENCES clauses: artists precedes songs, and
# songplays comes last because it points at all four other tables.
create_table_queries = [
    artist_table_create,
    user_table_create,
    song_table_create,
    time_table_create,
    songplay_table_create,
]

# Drop order removes referencing tables first: songplays, then songs ahead of
# artists.
drop_table_queries = [
    songplay_table_drop,
    user_table_drop,
    song_table_drop,
    artist_table_drop,
    time_table_drop,
]