{ "data_id": "45028", "name": "california", "exact_name": "california", "version": 7, "version_label": null, "description": "Dataset used in the tabular data benchmark https:\/\/github.com\/LeoGrin\/tabular-benchmark, transformed in the same way. This dataset belongs to the \"classification on numerical features\" benchmark.\n Original source: https:\/\/www.dcc.fc.up.pt\/~ltorgo\/Regression\/cal_housing.html Please give credit to the original source if you use this dataset.", "format": "arff", "uploader": "Leo Grin", "uploader_id": 26324, "visibility": "public", "creator": "\"See source\"", "contributor": "\"Leo Grin\"", "date": "2023-01-03 16:13:55", "update_comment": null, "last_update": "2023-01-03 16:13:55", "licence": "See source", "status": "active", "error_message": null, "url": "https:\/\/api.openml.org\/data\/download\/22111914\/dataset", "default_target_attribute": "price_above_median", "row_id_attribute": null, "ignore_attribute": null, "runs": 0, "suggest": { "input": [ "california", "Dataset used in the tabular data benchmark https:\/\/github.com\/LeoGrin\/tabular-benchmark, transformed in the same way. This dataset belongs to the \"classification on numerical features\" benchmark. Original source: https:\/\/www.dcc.fc.up.pt\/~ltorgo\/Regression\/cal_housing.html Please give credit to the original source if you use this dataset. " ], "weight": 5 }, "qualities": { "NumberOfInstances": 20634, "NumberOfFeatures": 9, "NumberOfClasses": 2, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 8, "NumberOfSymbolicFeatures": 1, "MinorityClassPercentage": 50, "MinorityClassSize": 10317, "NumberOfBinaryFeatures": 1, "PercentageOfBinaryFeatures": 11.11111111111111, "PercentageOfInstancesWithMissingValues": 0, "PercentageOfMissingValues": 0, "AutoCorrelation": 0.9999515339504677, "Dimensionality": 0.00043617330619366096, "PercentageOfNumericFeatures": 88.88888888888889, "MajorityClassPercentage": 50, "PercentageOfSymbolicFeatures": 11.11111111111111, "MajorityClassSize": 10317 }, "tags": [ { "uploader": "38960", "tag": "Demographics" }, { "uploader": "38960", "tag": "Machine Learning" } ], "features": [ { "name": "price_above_median", "index": "8", "type": "nominal", "distinct": "2", "missing": "0", "target": "1", "distr": [ [ "0", "1" ], [ [ "10317", "0" ], [ "0", "10317" ] ] ] }, { "name": "MedInc", "index": "0", "type": "numeric", "distinct": "12925", "missing": "0", "min": "0", "max": "15", "mean": "4", "stdev": "2" }, { "name": "HouseAge", "index": "1", "type": "numeric", "distinct": "52", "missing": "0", "min": "1", "max": "52", "mean": "29", "stdev": "13" }, { "name": "AveRooms", "index": "2", "type": "numeric", "distinct": "19387", "missing": "0", "min": "1", "max": "142", "mean": "5", "stdev": "2" }, { "name": "AveBedrms", "index": "3", "type": "numeric", "distinct": "14229", "missing": "0", "min": "0", "max": "34", "mean": "1", "stdev": "0" }, { "name": "Population", "index": "4", "type": "numeric", "distinct": "3887", "missing": "0", "min": "3", "max": "35682", "mean": "1425", "stdev": "1132" }, { "name": "AveOccup", "index": "5", "type": "numeric", "distinct": "18837", "missing": "0", "min": "1", "max": "1243", "mean": "3", "stdev": "10" }, { "name": "Latitude", "index": "6", "type": "numeric", "distinct": "862", "missing": "0", "min": "33", "max": "42", "mean": "36", "stdev": "2" }, { "name": "Longitude", "index": "7", "type": "numeric", "distinct": "844", "missing": "0", "min": "-124", "max": "0", "mean": "-120", "stdev": "2" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }