{ "data_id": "43517", "name": "Data-Science-YouTube-channels-Video-Metadata", "exact_name": "Data-Science-YouTube-channels-Video-Metadata", "version": 1, "version_label": "v1.0", "description": "Content\nThis dataset contains metadata for videos from around 60 Data Science YouTube channels.\nAcknowledgements\nData scraped from https:\/\/wiki.digitalmethods.net\/Dmi\/ToolDatabase .\nCover Photo: Photo by Rachit Tank on Unsplash.\nMotivation : Dataset by Gabriel Preda\nInspiration\nPossible uses for this dataset could include:\n\nSentiment analysis\/\nCategorising YouTube videos based on their comments and statistics.\nTraining ML algorithms like RNNs to generate their own YouTube description.\nMost popular data science youtube channel based on total likes, dislikes, votes counts.\nStatistical analysis over different channels.\n\nFeel free to check notebook for other possible uses.", "format": "arff", "uploader": "Onur Yildirim", "uploader_id": 30126, "visibility": "public", "creator": null, "contributor": null, "date": "2022-03-23 13:32:16", "update_comment": null, "last_update": "2022-03-23 13:32:16", "licence": "CC BY-NC-SA 4.0", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/22102342\/dataset", "default_target_attribute": null, "row_id_attribute": null, "ignore_attribute": null, "runs": 0, "suggest": { "input": [ "Data-Science-YouTube-channels-Video-Metadata", "Content This dataset contains metadata for videos from around 60 Data Science YouTube channels. Acknowledgements Data scraped from https:\/\/wiki.digitalmethods.net\/Dmi\/ToolDatabase . Cover Photo: Photo by Rachit Tank on Unsplash. Motivation : Dataset by Gabriel Preda Inspiration Possible uses for this dataset could include: Sentiment analysis\/ Categorising YouTube videos based on their comments and statistics. Training ML algorithms like RNNs to generate their own YouTube description. 
Most po " ], "weight": 5 }, "qualities": { "NumberOfInstances": 44261, "NumberOfFeatures": 21, "NumberOfClasses": null, "NumberOfMissingValues": 47056, "NumberOfInstancesWithMissingValues": 31554, "NumberOfNumericFeatures": 8, "NumberOfSymbolicFeatures": 1, "Dimensionality": 0.00047445832674363435, "PercentageOfNumericFeatures": 38.095238095238095, "MajorityClassPercentage": null, "PercentageOfSymbolicFeatures": 4.761904761904762, "MajorityClassSize": null, "MinorityClassPercentage": null, "MinorityClassSize": null, "NumberOfBinaryFeatures": 1, "PercentageOfBinaryFeatures": 4.761904761904762, "PercentageOfInstancesWithMissingValues": 71.29075258127922, "AutoCorrelation": null, "PercentageOfMissingValues": 5.062610209353392 }, "tags": [ { "uploader": "38960", "tag": "Machine Learning" }, { "uploader": "38960", "tag": "Mathematics" } ], "features": [ { "name": "channelId", "index": "0", "type": "string", "distinct": "60", "missing": "0" }, { "name": "channelTitle", "index": "1", "type": "string", "distinct": "60", "missing": "0" }, { "name": "videoId", "index": "2", "type": "string", "distinct": "43709", "missing": "0" }, { "name": "publishedAt", "index": "3", "type": "string", "distinct": "36001", "missing": "0" }, { "name": "publishedAtSQL", "index": "4", "type": "string", "distinct": "32799", "missing": "0" }, { "name": "videoTitle", "index": "5", "type": "string", "distinct": "43777", "missing": "1" }, { "name": "videoDescription", "index": "6", "type": "string", "distinct": "36257", "missing": "482" }, { "name": "videoCategoryId", "index": "7", "type": "numeric", "distinct": "15", "missing": "1", "min": "1", "max": "29", "mean": "27", "stdev": "2" }, { "name": "videoCategoryLabel", "index": "8", "type": "string", "distinct": "15", "missing": "1" }, { "name": "duration", "index": "9", "type": "string", "distinct": "5769", "missing": "1" }, { "name": "durationSec", "index": "10", "type": "numeric", "distinct": "3506", "missing": "1", "min": "0", "max": "3599", 
"mean": "809", "stdev": "817" }, { "name": "dimension", "index": "11", "type": "string", "distinct": "1", "missing": "1" }, { "name": "definition", "index": "12", "type": "string", "distinct": "2", "missing": "1" }, { "name": "caption", "index": "13", "type": "nominal", "distinct": "2", "missing": "1", "distr": [] }, { "name": "thumbnail_maxres", "index": "14", "type": "string", "distinct": "34232", "missing": "10029" }, { "name": "licensedContent", "index": "15", "type": "numeric", "distinct": "1", "missing": "25450", "min": "1", "max": "1", "mean": "1", "stdev": "0" }, { "name": "viewCount", "index": "16", "type": "numeric", "distinct": "18914", "missing": "3", "min": "0", "max": "17787179", "mean": "32383", "stdev": "228805" }, { "name": "likeCount", "index": "17", "type": "numeric", "distinct": "3019", "missing": "859", "min": "0", "max": "432355", "mean": "539", "stdev": "5939" }, { "name": "dislikeCount", "index": "18", "type": "numeric", "distinct": "517", "missing": "859", "min": "0", "max": "12563", "mean": "15", "stdev": "146" }, { "name": "favoriteCount", "index": "19", "type": "numeric", "distinct": "1", "missing": "1", "min": "0", "max": "0", "mean": "0", "stdev": "0" }, { "name": "commentCount", "index": "20", "type": "numeric", "distinct": "873", "missing": "9365", "min": "0", "max": "25774", "mean": "48", "stdev": "389" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }