{ "data_id": "43532", "name": "The-Social-Dilemma-Tweets---Text-Classification", "exact_name": "The-Social-Dilemma-Tweets---Text-Classification", "version": 1, "version_label": "v1.0", "description": "Context\nThe Social Dilemma, a documentary-drama hybrid explores the dangerous human impact of social networking, with tech experts sounding the alarm on their own creations as the tech experts sound the alarm on the dangerous human impact of social networking.\nInitial release: January 2020\nDirector: Jeff Orlowski\nProducer: Larissa Rhodes\nMusic director: Mark A. Crawford\nScreenplay: Jeff Orlowski, Vickie Curtis, Davis Coombe\nContent\nThis dataset brings you the twitter responses made with the TheSocialDilemma hashtag after watching the eye-opening documentary \"The Social Dilemma\" released on an OTT platform (Netflix) on September 9th, 2020.\nThe dataset was extracted using TwitterAPI, consisting of nearly 10,526 tweets from twitter users all over the globe!\n\n\n\nNo\nColumns\nDescriptions\n\n\n\n\n1\nuser_name\nThe name of the user, as they've defined it.\n\n\n2\nuser_location\nThe user-defined location for this account's profile.\n\n\n3\nuser_description\nThe user-defined UTF-8 string describing their account.\n\n\n4\nuser_created\nTime and date, when the account was created.\n\n\n5\nuser_followers\nThe number of followers an account currently has.\n\n\n6\nuser_friends\nThe number of friends an account currently has.\n\n\n7\nuser_favourites\nThe number of favorites an account currently has\n\n\n8\nuser_verified\nWhen true, indicates that the user has a verified account\n\n\n9\ndate\nUTC time and date when the Tweet was created\n\n\n10\ntext\nThe actual UTF-8 text of the Tweet\n\n\n11\nhashtags\nAll the other hashtags posted in the tweet along with TheSocialDilemma\n\n\n12\nsource\nUtility used to post the Tweet, Tweets from the Twitter website have a source value - web\n\n\n13\nis_retweet\nIndicates whether this Tweet has been Retweeted by the authenticating 
user.\n\n\n14\nSentiment(Target variable)\nIndicates the sentiment of the tweet, consists of three categories: Positive, neutral, and negative\n\n\n\nInspiration\nYou can use this data to dive into the subjects that use this hashtag, look at the geographical distribution, evaluate sentiments, and look at trends.", "format": "arff", "uploader": "Onur Yildirim", "uploader_id": 30126, "visibility": "public", "creator": null, "contributor": null, "date": "2022-03-23 13:44:54", "update_comment": null, "last_update": "2022-03-23 13:44:54", "licence": "CC0: Public Domain", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/22102357\/dataset", "default_target_attribute": null, "row_id_attribute": null, "ignore_attribute": null, "runs": 0, "suggest": { "input": [ "The-Social-Dilemma-Tweets---Text-Classification", "Context The Social Dilemma, a documentary-drama hybrid explores the dangerous human impact of social networking, with tech experts sounding the alarm on their own creations as the tech experts sound the alarm on the dangerous human impact of social networking. Initial release: January 2020 Director: Jeff Orlowski Producer: Larissa Rhodes Music director: Mark A. 
Crawford Screenplay: Jeff Orlowski, Vickie Curtis, Davis Coombe Content This dataset brings you the twitter responses made with the TheS " ], "weight": 5 }, "qualities": { "NumberOfInstances": 20068, "NumberOfFeatures": 14, "NumberOfClasses": null, "NumberOfMissingValues": 10429, "NumberOfInstancesWithMissingValues": 8638, "NumberOfNumericFeatures": 3, "NumberOfSymbolicFeatures": 2, "Dimensionality": 0.0006976280645804266, "PercentageOfNumericFeatures": 21.428571428571427, "MajorityClassPercentage": null, "PercentageOfSymbolicFeatures": 14.285714285714285, "MajorityClassSize": null, "MinorityClassPercentage": null, "MinorityClassSize": null, "NumberOfBinaryFeatures": 2, "PercentageOfBinaryFeatures": 14.285714285714285, "PercentageOfInstancesWithMissingValues": 43.04365158461232, "AutoCorrelation": null, "PercentageOfMissingValues": 3.7120219824026877 }, "tags": [ { "uploader": "38960", "tag": "Computer Systems" }, { "uploader": "38960", "tag": "Machine Learning" } ], "features": [ { "name": "user_name", "index": "0", "type": "string", "distinct": "15184", "missing": "328" }, { "name": "user_location", "index": "1", "type": "string", "distinct": "5652", "missing": "4293" }, { "name": "user_description", "index": "2", "type": "string", "distinct": "14724", "missing": "1511" }, { "name": "user_created", "index": "3", "type": "string", "distinct": "16109", "missing": "0" }, { "name": "user_followers", "index": "4", "type": "numeric", "distinct": "4141", "missing": "0", "min": "0", "max": "15624426", "mean": "8805", "stdev": "154001" }, { "name": "user_friends", "index": "5", "type": "numeric", "distinct": "3220", "missing": "0", "min": "0", "max": "288625", "mean": "1117", "stdev": "5170" }, { "name": "user_favourites", "index": "6", "type": "numeric", "distinct": "9945", "missing": "0", "min": "0", "max": "708749", "mean": "13937", "stdev": "30438" }, { "name": "user_verified", "index": "7", "type": "nominal", "distinct": "2", "missing": "0", "distr": [] }, { "name": 
"date", "index": "8", "type": "string", "distinct": "19811", "missing": "0" }, { "name": "text", "index": "9", "type": "string", "distinct": "19804", "missing": "0" }, { "name": "hashtags", "index": "10", "type": "string", "distinct": "1753", "missing": "4297" }, { "name": "source", "index": "11", "type": "string", "distinct": "82", "missing": "0" }, { "name": "is_retweet", "index": "12", "type": "nominal", "distinct": "1", "missing": "0", "distr": [] }, { "name": "Sentiment", "index": "13", "type": "string", "distinct": "3", "missing": "0" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }