{ "data_id": "43901", "name": "click_prediction_small", "exact_name": "click_prediction_small", "version": 11, "version_label": null, "description": "Modified version of subsampled dataset from Tencent Inc. on OpenML. Duplicate rows are dropped. Columns with a high ratio of unique values are dropped. Some columns are cast to factor.", "format": "ARFF", "uploader": "Mine Gazioglu", "uploader_id": 30861, "visibility": "public", "creator": null, "contributor": null, "date": "2022-05-31 21:08:33", "update_comment": null, "last_update": "2022-05-31 21:08:33", "licence": "public", "status": "active", "error_message": null, "url": "https:\/\/old.openml.org\/data\/download\/22102809\/file414830787f10.arff", "kaggle_url": null, "default_target_attribute": "click", "row_id_attribute": null, "ignore_attribute": null, "runs": 0, "suggest": { "input": [ "click_prediction_small",
"Modified version of subsampled dataset from Tencent Inc. on OpenML. Duplicate rows are dropped. Columns with a high ratio of unique values are dropped. Some columns are cast to factor. \n" ], "weight": 5 }, "qualities": { "NumberOfInstances": 39926, "NumberOfFeatures": 9, "NumberOfClasses": 2, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 4, "NumberOfSymbolicFeatures": 5, "PercentageOfBinaryFeatures": 11.11111111111111, "PercentageOfInstancesWithMissingValues": 0, "PercentageOfMissingValues": 0, "AutoCorrelation": 0.7169192235441453, "PercentageOfNumericFeatures": 44.44444444444444, "Dimensionality": 0.00022541702148975605, "PercentageOfSymbolicFeatures": 55.55555555555556, "MajorityClassPercentage": 83.15633922757101, "MajorityClassSize": 33201, "MinorityClassPercentage": 16.843660772428994, "MinorityClassSize": 6725, "NumberOfBinaryFeatures": 1 }, "tags": [], "features": [ { "name": "click", "index": "0", "type": "nominal", "distinct": "2", "missing": "0", "target": "1", "distr": [ [ "0", "1" ], [ [ "33201", "0" ], [ "0", "6725" ] ] ] }, { "name": "impression", "index": "1", "type": "numeric", "distinct": "99", "missing": "0", "min": "1", "max": "11820", "mean": "2", "stdev": "66" }, { "name": "url_hash", "index": "2", "type": "numeric", "distinct": "6941", "missing": "0", "min": "2147483647", "max": "2147483647", "mean": "2147483647", "stdev": "2147483647" }, { "name": "ad_id", "index": "3", "type": "nominal", "distinct": "19228", "missing": "0", "distr": [] }, { "name": "advertiser_id", "index": "4", "type": "nominal", "distinct": "6064", "missing": "0", "distr": [] }, { "name": "depth", "index": "5", "type": "numeric", "distinct": "3", "missing": "0", "min": "1", "max": "3", "mean": "2", "stdev": "1" }, { "name": "position", "index": "6", "type": "numeric", "distinct": "3", "missing": "0", "min": "1", "max": "3", "mean": "1", "stdev": "1" }, { "name": "keyword_id", "index": "7", "type": "nominal", "distinct": "19803", "missing": "0", "distr": [] }, { "name": "description_id", "index": "8", "type": "nominal", "distinct": "22381", "missing": "0", "distr": [] } ], "nr_of_issues": 0,
"nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }