|
|
@ -27,30 +27,24 @@ print(df['duration_ms'])
|
|
|
|
|
|
|
|
|
|
|
|
df['duration_ms'] = pd.to_timedelta(df['duration_ms'], unit='ms')
|
|
|
|
df['duration_ms'] = pd.to_timedelta(df['duration_ms'], unit='ms')
|
|
|
|
df = df.rename(columns={"duration_ms": "duration_m"})
|
|
|
|
df = df.rename(columns={"duration_ms": "duration_m"})
|
|
|
|
# faire *60 /100 à la virgule
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
# df['duration_m'] = df['duration_m'].round(2)
|
|
|
|
|
|
|
|
print(df['duration_m'])
|
|
|
|
print(df['duration_m'])
|
|
|
|
|
|
|
|
|
|
|
|
# test = pd.to_timedelta(df["duration_m"], unit="m")
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
# print(df['duration_m'].to_period('M'))
|
|
|
|
|
|
|
|
# print(test)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
# df = df.drop_duplicates()
|
|
|
|
|
|
|
|
# pas besoin car aucun titre en double
|
|
|
|
|
|
|
|
df = df.drop(151)
|
|
|
|
df = df.drop(151)
|
|
|
|
|
|
|
|
|
|
|
|
dfT = df[['track_id', 'track_name', 'track_popularity', 'duration_m', 'danceability', 'energy', 'loudness','speechiness', 'acousticness', 'liveness', 'valence', 'tempo', 'track_artist', 'track_album_id','track_artist']]
|
|
|
|
dfT = df[['track_id', 'track_name', 'track_popularity', 'duration_m', 'danceability', 'energy', 'loudness','speechiness', 'acousticness', 'liveness', 'valence', 'tempo', 'track_artist', 'track_album_id','playlist_id']]
|
|
|
|
dfA = df[['track_album_id', 'track_album_name', 'track_album_release_date', 'track_artist']]
|
|
|
|
dfA = df[['track_album_id', 'track_album_name', 'track_album_release_date', 'track_artist']]
|
|
|
|
dfP = df[['playlist_id', 'playlist_name', 'playlist_genre', 'playlist_subgenre']]
|
|
|
|
dfP = df[['playlist_id', 'playlist_name', 'playlist_genre', 'playlist_subgenre']]
|
|
|
|
dfArtist = df[['track_artist']]
|
|
|
|
dfArtist = df[['track_artist']]
|
|
|
|
dfArtist = dfArtist.drop_duplicates()
|
|
|
|
dfArtist = dfArtist.drop_duplicates()
|
|
|
|
dfA = dfA.drop_duplicates()
|
|
|
|
dfA = dfA.drop_duplicates()
|
|
|
|
dfA['track_album_id'] = dfA['track_album_id'].drop_duplicates()
|
|
|
|
dfA['track_album_id'] = dfA['track_album_id'].drop_duplicates()
|
|
|
|
|
|
|
|
dfA = dfA.dropna()
|
|
|
|
|
|
|
|
dfP = dfP.drop_duplicates()
|
|
|
|
|
|
|
|
dfP['playlist_id'] = dfP['playlist_id'].drop_duplicates()
|
|
|
|
|
|
|
|
dfP = dfP.dropna()
|
|
|
|
|
|
|
|
dfT = dfT.drop_duplicates()
|
|
|
|
|
|
|
|
dfT['track_id'] = dfT['track_id'].drop_duplicates()
|
|
|
|
|
|
|
|
dfT = dfT.dropna()
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
@ -67,7 +61,7 @@ try :
|
|
|
|
co.execute(text('''DROP TABLE IF EXISTS Album CASCADE;'''))
|
|
|
|
co.execute(text('''DROP TABLE IF EXISTS Album CASCADE;'''))
|
|
|
|
co.execute(text('''CREATE TABLE Album(
|
|
|
|
co.execute(text('''CREATE TABLE Album(
|
|
|
|
track_album_id varchar(150),
|
|
|
|
track_album_id varchar(150),
|
|
|
|
track_album_name varchar(150),
|
|
|
|
track_album_name varchar(500),
|
|
|
|
track_album_release_date varchar(15),
|
|
|
|
track_album_release_date varchar(15),
|
|
|
|
track_artist varchar(150) REFERENCES Artist,
|
|
|
|
track_artist varchar(150) REFERENCES Artist,
|
|
|
|
PRIMARY KEY (track_album_id)
|
|
|
|
PRIMARY KEY (track_album_id)
|
|
|
@ -75,11 +69,10 @@ try :
|
|
|
|
|
|
|
|
|
|
|
|
co.execute(text('''DROP TABLE IF EXISTS Playlist CASCADE;'''))
|
|
|
|
co.execute(text('''DROP TABLE IF EXISTS Playlist CASCADE;'''))
|
|
|
|
co.execute(text('''CREATE TABLE Playlist(
|
|
|
|
co.execute(text('''CREATE TABLE Playlist(
|
|
|
|
playlist_id varchar(150),
|
|
|
|
playlist_id varchar(150) PRIMARY KEY,
|
|
|
|
playlist_name varchar(150),
|
|
|
|
playlist_name varchar(150),
|
|
|
|
playlist_genre varchar(50),
|
|
|
|
playlist_genre varchar(50),
|
|
|
|
playlist_subgenre varchar(150),
|
|
|
|
playlist_subgenre varchar(150)
|
|
|
|
PRIMARY KEY (playlist_id)
|
|
|
|
|
|
|
|
);'''))
|
|
|
|
);'''))
|
|
|
|
|
|
|
|
|
|
|
|
co.execute(text('''DROP TABLE IF EXISTS Track CASCADE;'''))
|
|
|
|
co.execute(text('''DROP TABLE IF EXISTS Track CASCADE;'''))
|
|
|
@ -124,7 +117,7 @@ try :
|
|
|
|
co.execute(text('''INSERT INTO Track VALUES(:1, :2, :3, :4, :5, :6, :7, :8, :9, :10, :11, :12, :13, :14, :15);'''),
|
|
|
|
co.execute(text('''INSERT INTO Track VALUES(:1, :2, :3, :4, :5, :6, :7, :8, :9, :10, :11, :12, :13, :14, :15);'''),
|
|
|
|
{'1': row.track_id, '2': row.track_name, '3': row.track_popularity, '4': row.duration_m, '5': row.danceability, '6': row.energy, '7': row.loudness,
|
|
|
|
{'1': row.track_id, '2': row.track_name, '3': row.track_popularity, '4': row.duration_m, '5': row.danceability, '6': row.energy, '7': row.loudness,
|
|
|
|
'8': row.speechiness, '9': row.acousticness, '10': row.liveness, '11': row.valence, '12': row.tempo, '13': row.track_artist, '14': row.track_album_id,
|
|
|
|
'8': row.speechiness, '9': row.acousticness, '10': row.liveness, '11': row.valence, '12': row.tempo, '13': row.track_artist, '14': row.track_album_id,
|
|
|
|
'15': row.track_artist})
|
|
|
|
'15': row.playlist_id})
|
|
|
|
co.execute(text('''SELECT * FROM Track;'''))
|
|
|
|
co.execute(text('''SELECT * FROM Track;'''))
|
|
|
|
co.commit()
|
|
|
|
co.commit()
|
|
|
|
|
|
|
|
|
|
|
|