{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {
    "id": "K6Ek26jtEbzM"
   },
   "outputs": [],
   "source": [
    "import pandas as pd"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {
    "id": "jSok_FhgFQPa"
   },
   "outputs": [],
   "source": [
    "# Load the source CSV into the working DataFrame.\n",
    "df = pd.read_csv(filepath_or_buffer='data/data.csv')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "Index(['valence', 'year', 'acousticness', 'artists', 'danceability',\n",
       " 'duration_ms', 'energy', 'explicit', 'id', 'instrumentalness', 'key',\n",
       " 'liveness', 'loudness', 'mode', 'name', 'popularity', 'release_date',\n",
       " 'speechiness', 'tempo'],\n",
       " dtype='object')"
      ]
     },
     "execution_count": 3,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df.columns"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Columns to keep in the cleaned export, in output order.\n",
    "# Compared with the df.columns listing, this leaves out\n",
    "# 'explicit' and 'release_date'.\n",
    "selected_columns = [\n",
    "    'valence',\n",
    "    'year',\n",
    "    'acousticness',\n",
    "    'artists',\n",
    "    'danceability',\n",
    "    'duration_ms',\n",
    "    'energy',\n",
    "    'id',\n",
    "    'instrumentalness',\n",
    "    'key',\n",
    "    'liveness',\n",
    "    'loudness',\n",
    "    'mode',\n",
    "    'name',\n",
    "    'popularity',\n",
    "    'speechiness',\n",
    "    'tempo',\n",
    "]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Write only the selected columns to a new CSV, without the row index.\n",
    "df.to_csv(\n",
    "    path_or_buf='data/data_clean.csv',\n",
    "    columns=selected_columns,\n",
    "    index=False,\n",
    ")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [ "
\n", " | valence | \n", "year | \n", "acousticness | \n", "artists | \n", "danceability | \n", "duration_ms | \n", "energy | \n", "explicit | \n", "id | \n", "instrumentalness | \n", "key | \n", "liveness | \n", "loudness | \n", "mode | \n", "name | \n", "popularity | \n", "release_date | \n", "speechiness | \n", "tempo | \n", "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | \n", "0.0594 | \n", "1921 | \n", "0.982 | \n", "['Sergei Rachmaninoff', 'James Levine', 'Berli... | \n", "0.279 | \n", "831667 | \n", "0.211 | \n", "0 | \n", "4BJqT0PrAfrxzMOxytFOIz | \n", "0.878000 | \n", "10 | \n", "0.665 | \n", "-20.096 | \n", "1 | \n", "Piano Concerto No. 3 in D Minor, Op. 30: III. ... | \n", "4 | \n", "1921 | \n", "0.0366 | \n", "80.954 | \n", "
1 | \n", "0.9630 | \n", "1921 | \n", "0.732 | \n", "['Dennis Day'] | \n", "0.819 | \n", "180533 | \n", "0.341 | \n", "0 | \n", "7xPhfUan2yNtyFG0cUWkt8 | \n", "0.000000 | \n", "7 | \n", "0.160 | \n", "-12.441 | \n", "1 | \n", "Clancy Lowered the Boom | \n", "5 | \n", "1921 | \n", "0.4150 | \n", "60.936 | \n", "
2 | \n", "0.0394 | \n", "1921 | \n", "0.961 | \n", "['KHP Kridhamardawa Karaton Ngayogyakarta Hadi... | \n", "0.328 | \n", "500062 | \n", "0.166 | \n", "0 | \n", "1o6I8BglA6ylDMrIELygv1 | \n", "0.913000 | \n", "3 | \n", "0.101 | \n", "-14.850 | \n", "1 | \n", "Gati Bali | \n", "5 | \n", "1921 | \n", "0.0339 | \n", "110.339 | \n", "
3 | \n", "0.1650 | \n", "1921 | \n", "0.967 | \n", "['Frank Parker'] | \n", "0.275 | \n", "210000 | \n", "0.309 | \n", "0 | \n", "3ftBPsC5vPBKxYSee08FDH | \n", "0.000028 | \n", "5 | \n", "0.381 | \n", "-9.316 | \n", "1 | \n", "Danny Boy | \n", "3 | \n", "1921 | \n", "0.0354 | \n", "100.109 | \n", "
4 | \n", "0.2530 | \n", "1921 | \n", "0.957 | \n", "['Phil Regan'] | \n", "0.418 | \n", "166693 | \n", "0.193 | \n", "0 | \n", "4d6HGyGT8e121BsdKmw9v6 | \n", "0.000002 | \n", "3 | \n", "0.229 | \n", "-10.096 | \n", "1 | \n", "When Irish Eyes Are Smiling | \n", "2 | \n", "1921 | \n", "0.0380 | \n", "101.665 | \n", "