{ "data_id": "43386", "name": "Spotify---All-Time-Top-2000s-Mega-Dataset", "exact_name": "Spotify---All-Time-Top-2000s-Mega-Dataset", "version": 1, "version_label": "v1.0", "description": "Context\nThis dataset contains audio statistics of the top 2000 tracks on Spotify. The data contains about 15 columns each describing the track and it's qualities. Songs released from 1956 to 2019 are included from some notable and famous artists like Queen, The Beatles, Guns N' Roses, etc.\nhttp:\/\/sortyourmusic.playlistmachinery.com\/ by plamere uses Spotify API to extract the audio features from the tracks given the Spotify Playlist URI. This data contains audio features like Danceability, BPM, Liveness, Valence(Positivity) and many more.\nEach feature's description has been given in detail below.\nContent\n\nIndex: ID\nTitle: Name of the Track\nArtist: Name of the Artist\nTop Genre: Genre of the track\nYear: Release Year of the track\nBeats per Minute(BPM): The tempo of the song\nEnergy: The energy of a song - the higher the value, the more energtic. song\nDanceability: The higher the value, the easier it is to dance to this song.\nLoudness: The higher the value, the louder the song.\nValence: The higher the value, the more positive mood for the song.\nLength: The duration of the song.\nAcoustic: The higher the value the more acoustic the song is.\nSpeechiness: The higher the value the more spoken words the song contains\nPopularity: The higher the value the more popular the song is.\n\nAcknowledgements\nThis data is extracted from the Spotify playlist - Top 2000s on PlaylistMachinery(plamere) using Selenium with Python. More specifically, it was scraped from http:\/\/sortyourmusic.playlistmachinery.com\/. Thanks to Paul for providing a free and open source to extract features and do cool stuff with your Spotify playlists!\nInspiration\nThis is a very fun dataset to explore and find out unique links which land songs in the Top 2000s. With this dataset, I wanted to be able to answer some questions like:\n\nWhich genres were more popular coming through 1950s to 2000s?\nSongs of which genre mostly saw themselves landing in the Top 2000s?\nWhich artists were more likely to make a top song?\nSongs containing which words are more popular?\nWhat is the average tempo of songs compared over the years?\nIs there a trend of acoustic songs being popular back in 1960s than they are now?\nIs there a trend in genres preferred back in the day vs now?\n and a lot more.", "format": "arff", "uploader": "Onur Yildirim", "uploader_id": 30126, "visibility": "public", "creator": null, "contributor": null, "date": "2022-03-23 12:52:22", "update_comment": null, "last_update": "2022-03-23 12:52:22", "licence": "CC0: Public Domain", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/22102211\/dataset", "default_target_attribute": null, "row_id_attribute": null, "ignore_attribute": null, "runs": 0, "suggest": { "input": [ "Spotify---All-Time-Top-2000s-Mega-Dataset", "Context This dataset contains audio statistics of the top 2000 tracks on Spotify. The data contains about 15 columns each describing the track and it's qualities. Songs released from 1956 to 2019 are included from some notable and famous artists like Queen, The Beatles, Guns N' Roses, etc. http:\/\/sortyourmusic.playlistmachinery.com\/ by plamere uses Spotify API to extract the audio features from the tracks given the Spotify Playlist URI. This data contains audio features like Danceability, BPM, L " ], "weight": 5 }, "qualities": { "NumberOfInstances": 1994, "NumberOfFeatures": 15, "NumberOfClasses": null, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 11, "NumberOfSymbolicFeatures": 0, "Dimensionality": 0.007522567703109328, "PercentageOfNumericFeatures": 73.33333333333333, "MajorityClassPercentage": null, "PercentageOfSymbolicFeatures": 0, "MajorityClassSize": null, "MinorityClassPercentage": null, "MinorityClassSize": null, "NumberOfBinaryFeatures": 0, "PercentageOfBinaryFeatures": 0, "PercentageOfInstancesWithMissingValues": 0, "AutoCorrelation": null, "PercentageOfMissingValues": 0 }, "tags": [ { "uploader": "38960", "tag": "Computer Systems" }, { "uploader": "38960", "tag": "Machine Learning" } ], "features": [ { "name": "Index", "index": "0", "type": "numeric", "distinct": "1994", "missing": "0", "min": "1", "max": "1994", "mean": "998", "stdev": "576" }, { "name": "Title", "index": "1", "type": "string", "distinct": "1958", "missing": "0" }, { "name": "Artist", "index": "2", "type": "string", "distinct": "731", "missing": "0" }, { "name": "Top_Genre", "index": "3", "type": "string", "distinct": "149", "missing": "0" }, { "name": "Year", "index": "4", "type": "numeric", "distinct": "63", "missing": "0", "min": "1956", "max": "2019", "mean": "1993", "stdev": "16" }, { "name": "Beats_Per_Minute_(BPM)", "index": "5", "type": "numeric", "distinct": "145", "missing": "0", "min": "37", "max": "206", "mean": "120", "stdev": "28" }, { "name": "Energy", "index": "6", "type": "numeric", "distinct": "98", "missing": "0", "min": "3", "max": "100", "mean": "60", "stdev": "22" }, { "name": "Danceability", "index": "7", "type": "numeric", "distinct": "84", "missing": "0", "min": "10", "max": "96", "mean": "53", "stdev": "15" }, { "name": "Loudness_(dB)", "index": "8", "type": "numeric", "distinct": "23", "missing": "0", "min": "-27", "max": "0", "mean": "-9", "stdev": "4" }, { "name": "Liveness", "index": "9", "type": "numeric", "distinct": "94", "missing": "0", "min": "2", "max": "99", "mean": "19", "stdev": "17" }, { "name": "Valence", "index": "10", "type": "numeric", "distinct": "97", "missing": "0", "min": "3", "max": "99", "mean": "49", "stdev": "25" }, { "name": "Length_(Duration)", "index": "11", "type": "string", "distinct": "350", "missing": "0" }, { "name": "Acousticness", "index": "12", "type": "numeric", "distinct": "100", "missing": "0", "min": "0", "max": "99", "mean": "29", "stdev": "29" }, { "name": "Speechiness", "index": "13", "type": "numeric", "distinct": "37", "missing": "0", "min": "2", "max": "55", "mean": "5", "stdev": "4" }, { "name": "Popularity", "index": "14", "type": "numeric", "distinct": "81", "missing": "0", "min": "11", "max": "100", "mean": "60", "stdev": "14" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }