diff --git a/test_Rémi b/test_Rémi index 71595ee..b570396 100644 --- a/test_Rémi +++ b/test_Rémi @@ -27,30 +27,24 @@ print(df['duration_ms']) df['duration_ms'] = pd.to_timedelta(df['duration_ms'], unit='ms') df = df.rename(columns={"duration_ms": "duration_m"}) -# faire *60 /100 à la virgule - -# df['duration_m'] = df['duration_m'].round(2) print(df['duration_m']) -# test = pd.to_timedelta(df["duration_m"], unit="m") - - -# print(df['duration_m'].to_period('M')) -# print(test) - - -# df = df.drop_duplicates() -# pas besoin car aucun titre en double df = df.drop(151) -dfT = df[['track_id', 'track_name', 'track_popularity', 'duration_m', 'danceability', 'energy', 'loudness','speechiness', 'acousticness', 'liveness', 'valence', 'tempo', 'track_artist', 'track_album_id','track_artist']] +dfT = df[['track_id', 'track_name', 'track_popularity', 'duration_m', 'danceability', 'energy', 'loudness','speechiness', 'acousticness', 'liveness', 'valence', 'tempo', 'track_artist', 'track_album_id','playlist_id']] dfA = df[['track_album_id', 'track_album_name', 'track_album_release_date', 'track_artist']] dfP = df[['playlist_id', 'playlist_name', 'playlist_genre', 'playlist_subgenre']] dfArtist = df[['track_artist']] dfArtist = dfArtist.drop_duplicates() dfA = dfA.drop_duplicates() dfA['track_album_id'] = dfA['track_album_id'].drop_duplicates() - +dfA = dfA.dropna() +dfP = dfP.drop_duplicates() +dfP['playlist_id'] = dfP['playlist_id'].drop_duplicates() +dfP = dfP.dropna() +dfT = dfT.drop_duplicates() +dfT['track_id'] = dfT['track_id'].drop_duplicates() +dfT = dfT.dropna() @@ -67,7 +61,7 @@ try : co.execute(text('''DROP TABLE IF EXISTS Album CASCADE;''')) co.execute(text('''CREATE TABLE Album( track_album_id varchar(150), - track_album_name varchar(150), + track_album_name varchar(500), track_album_release_date varchar(15), track_artist varchar(150) REFERENCES Artist, PRIMARY KEY (track_album_id) @@ -75,11 +69,10 @@ try : co.execute(text('''DROP TABLE IF EXISTS Playlist CASCADE;''')) co.execute(text('''CREATE TABLE Playlist( - playlist_id varchar(150), + playlist_id varchar(150) PRIMARY KEY, playlist_name varchar(150), playlist_genre varchar(50), - playlist_subgenre varchar(150), - PRIMARY KEY (playlist_id) + playlist_subgenre varchar(150) );''')) co.execute(text('''DROP TABLE IF EXISTS Track CASCADE;''')) @@ -124,7 +117,7 @@ try : co.execute(text('''INSERT INTO Track VALUES(:1, :2, :3, :4, :5, :6, :7, :8, :9, :10, :11, :12, :13, :14, :15);'''), {'1': row.track_id, '2': row.track_name, '3': row.track_popularity, '4': row.duration_m, '5': row.danceability, '6': row.energy, '7': row.loudness, '8': row.speechiness, '9': row.acousticness, '10': row.liveness, '11': row.valence, '12': row.tempo, '13': row.track_artist, '14': row.track_album_id, - '15': row.track_artist}) + '15': row.playlist_id}) co.execute(text('''SELECT * FROM Track;''')) co.commit()