{ "data_id": "43603", "name": "IMDB_movie_1972-2019", "exact_name": "IMDB_movie_1972-2019", "version": 1, "version_label": "v1.0", "description": "Context\nThe IMDB Movies Dataset contains information about 5834 movies. Information about these movies was scraped from imdb for purpose of creating a movie recommendation model. The data was preprocessed and cleaned to be ready for machine learning applications.\nContent\n\nTitle\nYear\nRating\nMetascore\nVotes\nDescription\nGenre\nRuntime (Minutes)\nRevenue (Millions)\nActors\nDirector", "format": "arff", "uploader": "Dustin Carrion", "uploader_id": 30123, "visibility": "public", "creator": null, "contributor": null, "date": "2022-03-24 00:38:42", "update_comment": null, "last_update": "2022-03-24 00:38:42", "licence": "CC0: Public Domain", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/22102428\/dataset", "default_target_attribute": null, "row_id_attribute": null, "ignore_attribute": null, "runs": 0, "suggest": { "input": [ "IMDB_movie_1972-2019", "Context The IMDB Movies Dataset contains information about 5834 movies. Information about these movies was scraped from imdb for purpose of creating a movie recommendation model. The data was preprocessed and cleaned to be ready for machine learning applications. Content Title Year Rating Metascore Votes Description Genre Runtime (Minutes) Revenue (Millions) Actors Director " ], "weight": 5 }, "qualities": { "NumberOfInstances": 5834, "NumberOfFeatures": 12, "NumberOfClasses": null, "NumberOfMissingValues": 121, "NumberOfInstancesWithMissingValues": 99, "NumberOfNumericFeatures": 7, "NumberOfSymbolicFeatures": 0, "Dimensionality": 0.002056907781967775, "PercentageOfNumericFeatures": 58.333333333333336, "MajorityClassPercentage": null, "PercentageOfSymbolicFeatures": 0, "MajorityClassSize": null, "MinorityClassPercentage": null, "MinorityClassSize": null, "NumberOfBinaryFeatures": 0, "PercentageOfBinaryFeatures": 0, "PercentageOfInstancesWithMissingValues": 1.6969489201234145, "AutoCorrelation": null, "PercentageOfMissingValues": 0.17283739001257 }, "tags": [ { "uploader": "38960", "tag": "Computer Systems" }, { "uploader": "38960", "tag": "Machine Learning" } ], "features": [ { "name": "Unnamed:_0", "index": "0", "type": "numeric", "distinct": "5285", "missing": "0", "min": "0", "max": "5284", "mean": "2403", "stdev": "1631" }, { "name": "Title", "index": "1", "type": "string", "distinct": "5707", "missing": "0" }, { "name": "Year", "index": "2", "type": "numeric", "distinct": "48", "missing": "0", "min": "1972", "max": "2019", "mean": "2002", "stdev": "11" }, { "name": "Rating", "index": "3", "type": "numeric", "distinct": "74", "missing": "0", "min": "2", "max": "9", "mean": "6", "stdev": "1" }, { "name": "Metascore", "index": "4", "type": "numeric", "distinct": "97", "missing": "29", "min": "1", "max": "99", "mean": "55", "stdev": "18" }, { "name": "Votes", "index": "5", "type": "numeric", "distinct": "5666", "missing": "0", "min": "29", "max": "2182098", "mean": "89992", "stdev": "159060" }, { "name": "Description", "index": "6", "type": "string", "distinct": "5826", "missing": "0" }, { "name": "Genre", "index": "7", "type": "string", "distinct": "489", "missing": "0" }, { "name": "Runtime_(Minutes)", "index": "8", "type": "numeric", "distinct": "129", "missing": "0", "min": "48", "max": "317", "mean": "107", "stdev": "18" }, { "name": "Revenue_(Millions)", "index": "9", "type": "numeric", "distinct": "3552", "missing": "92", "min": "0", "max": "937", "mean": "40", "stdev": "66" }, { "name": "Actors", "index": "10", "type": "string", "distinct": "5789", "missing": "0" }, { "name": "Director", "index": "11", "type": "string", "distinct": "2733", "missing": "0" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }