-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathsql_queries.py
99 lines (79 loc) · 3.22 KB
/
sql_queries.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
# DROP TABLES
# All five statements have the same shape, so they are rendered from a single
# template; only the table name varies. IF EXISTS keeps each statement from
# failing when its table has not been created yet.
_DROP_TABLE_TEMPLATE = "DROP TABLE IF EXISTS {}"

songplay_table_drop = _DROP_TABLE_TEMPLATE.format("songplays")
user_table_drop = _DROP_TABLE_TEMPLATE.format("users")
song_table_drop = _DROP_TABLE_TEMPLATE.format("songs")
artist_table_drop = _DROP_TABLE_TEMPLATE.format("artists")
time_table_drop = _DROP_TABLE_TEMPLATE.format("time")
# CREATE TABLES
# Each statement uses IF NOT EXISTS, so re-running it against a database that
# already has the table is a no-op rather than an error.

# songplays: one row per play event. songplay_id is a SERIAL key generated by
# the database; start_time, user_id, song_id and artist_id are foreign keys
# into the time, users, songs and artists tables respectively.
songplay_table_create = """CREATE TABLE IF NOT EXISTS songplays(
songplay_id SERIAL CONSTRAINT songplay_pk PRIMARY KEY,
start_time TIMESTAMP REFERENCES time (start_time),
user_id INT REFERENCES users (user_id),
level VARCHAR NOT NULL,
song_id VARCHAR REFERENCES songs (song_id),
artist_id VARCHAR REFERENCES artists (artist_id),
session_id INT NOT NULL,
location VARCHAR,
user_agent TEXT
)"""

# users: keyed by user_id; level is the only mandatory attribute.
user_table_create = """CREATE TABLE IF NOT EXISTS users(
user_id INT CONSTRAINT users_pk PRIMARY KEY,
first_name VARCHAR,
last_name VARCHAR,
gender CHAR(1),
level VARCHAR NOT NULL
)"""

# songs: keyed by song_id; artist_id is a foreign key into artists and year
# is constrained to be non-negative.
song_table_create = """CREATE TABLE IF NOT EXISTS songs(
song_id VARCHAR CONSTRAINT songs_pk PRIMARY KEY,
title VARCHAR,
artist_id VARCHAR REFERENCES artists (artist_id),
year INT CHECK (year >= 0),
duration FLOAT
)"""

# artists: keyed by artist_id; latitude/longitude are fixed-point values with
# six decimal places.
artist_table_create = """CREATE TABLE IF NOT EXISTS artists(
artist_id VARCHAR CONSTRAINT artist_pk PRIMARY KEY,
name VARCHAR,
location VARCHAR,
latitude DECIMAL(9,6),
longitude DECIMAL(9,6)
)"""

# time: keyed by the timestamp itself, with its parts stored as separate
# mandatory columns; the numeric parts are constrained to be non-negative.
time_table_create = """CREATE TABLE IF NOT EXISTS time(
start_time TIMESTAMP CONSTRAINT time_pk PRIMARY KEY,
hour INT NOT NULL CHECK (hour >= 0),
day INT NOT NULL CHECK (day >= 0),
week INT NOT NULL CHECK (week >= 0),
month INT NOT NULL CHECK (month >= 0),
year INT NOT NULL CHECK (year >= 0),
weekday VARCHAR NOT NULL
)"""
# INSERT RECORDS
# Every statement names its target columns explicitly, so the order of the
# %s placeholders is tied to column names rather than to the physical column
# order of the table. Placeholder counts are what callers must supply:
# songplays 8, users 5, songs 5, artists 5, time 7.

# songplay_id is omitted from the column list so the database assigns it from
# the column's SERIAL default.
songplay_table_insert = ("""INSERT INTO songplays
(start_time, user_id, level, song_id, artist_id, session_id, location, user_agent)
VALUES (%s, %s, %s, %s, %s, %s, %s, %s)
""")
# Updating the user level on conflict
user_table_insert = ("""INSERT INTO users (user_id, first_name, last_name, gender, level) VALUES (%s, %s, %s, %s, %s)
ON CONFLICT (user_id) DO UPDATE SET
level = EXCLUDED.level
""")
# A song that is already present is left untouched.
song_table_insert = ("""INSERT INTO songs (song_id, title, artist_id, year, duration) VALUES (%s, %s, %s, %s, %s)
ON CONFLICT (song_id) DO NOTHING
""")
# Artist location, latitude and longitude might change and need to be updated.
artist_table_insert = ("""INSERT INTO artists (artist_id, name, location, latitude, longitude) VALUES (%s, %s, %s, %s, %s)
ON CONFLICT (artist_id) DO UPDATE SET
location = EXCLUDED.location,
latitude = EXCLUDED.latitude,
longitude = EXCLUDED.longitude
""")
# A timestamp that is already present is left untouched.
time_table_insert = ("""INSERT INTO time (start_time, hour, day, week, month, year, weekday)
VALUES (%s, %s, %s, %s, %s, %s, %s)
ON CONFLICT (start_time) DO NOTHING
""")
# FIND SONGS
# Looks up the (song_id, artist_id) pair for a song by joining songs to
# artists and matching on three placeholders, in this order: song title,
# artist name, song duration.
song_select = (
    "\n"
    "SELECT song_id, artists.artist_id\n"
    "FROM songs JOIN artists ON songs.artist_id = artists.artist_id\n"
    "WHERE songs.title = %s\n"
    "AND artists.name = %s\n"
    "AND songs.duration = %s\n"
)
# QUERY LISTS
# Creation order follows the foreign keys: artists precedes songs (which
# references it), and songplays comes last because it references the other
# four tables.
create_table_queries = [
    user_table_create,
    artist_table_create,
    song_table_create,
    time_table_create,
    songplay_table_create,
]
# Drop order starts with songplays, the table that references all the others,
# and lists songs before the artists table it references.
drop_table_queries = [
    songplay_table_drop,
    user_table_drop,
    song_table_drop,
    artist_table_drop,
    time_table_drop,
]