{ "data_id": "42731", "name": "house_sales", "exact_name": "house_sales", "version": 3, "version_label": null, "description": "Date converted to year\/mo\/day numerics.This dataset contains house sale prices for King County, which includes Seattle. It includes homes sold between May 2014 and May 2015.\n\nIt contains 19 house features plus the price and the id columns, along with 21613 observations.\nIt's a great dataset for evaluating simple regression models.", "format": "arff", "uploader": "Pieter Gijsbers", "uploader_id": 869, "visibility": "public", "creator": "\"https:\/\/www.kaggle.com\/harlfoxem\/\"", "contributor": "\"https:\/\/www.kaggle.com\/harlfoxem\/\"", "date": "2020-11-18 08:51:57", "update_comment": null, "last_update": "2020-11-18 08:51:57", "licence": "CC0 Public Domain", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/22044765\/dataset", "default_target_attribute": "price", "row_id_attribute": "id", "ignore_attribute": null, "runs": 0, "suggest": { "input": [ "house_sales", "Date converted to year\/mo\/day numerics.This dataset contains house sale prices for King County, which includes Seattle. It includes homes sold between May 2014 and May 2015. It contains 19 house features plus the price and the id columns, along with 21613 observations. It's a great dataset for evaluating simple regression models. " ], "weight": 5 }, "qualities": { "NumberOfInstances": 21613, "NumberOfFeatures": 22, "NumberOfClasses": 0, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 21, "NumberOfSymbolicFeatures": 1, "Dimensionality": 0.001017905889973627, "PercentageOfNumericFeatures": 95.45454545454545, "MajorityClassPercentage": null, "PercentageOfSymbolicFeatures": 4.545454545454546, "MajorityClassSize": null, "MinorityClassPercentage": null, "MinorityClassSize": null, "NumberOfBinaryFeatures": 0, "PercentageOfBinaryFeatures": 0, "PercentageOfInstancesWithMissingValues": 0, "AutoCorrelation": -324979.41569498426, "PercentageOfMissingValues": 0 }, "tags": [ { "uploader": "38960", "tag": "Life Science" }, { "uploader": "38960", "tag": "Transportation" } ], "features": [ { "name": "price", "index": "1", "type": "numeric", "distinct": "4028", "missing": "0", "target": "1", "min": "75000", "max": "7700000", "mean": "540088", "stdev": "367127" }, { "name": "id", "index": "0", "type": "numeric", "distinct": "21436", "missing": "0", "identifier": "1", "min": "1000102", "max": "2147483647", "mean": "2147483647", "stdev": "2147483647" }, { "name": "bedrooms", "index": "2", "type": "numeric", "distinct": "13", "missing": "0", "min": "0", "max": "33", "mean": "3", "stdev": "1" }, { "name": "bathrooms", "index": "3", "type": "numeric", "distinct": "30", "missing": "0", "min": "0", "max": "8", "mean": "2", "stdev": "1" }, { "name": "sqft_living", "index": "4", "type": "numeric", "distinct": "1038", "missing": "0", "min": "290", "max": "13540", "mean": "2080", "stdev": "918" }, { "name": "sqft_lot", "index": "5", "type": "numeric", "distinct": "9782", "missing": "0", "min": "520", "max": "1651359", "mean": "15107", "stdev": "41421" }, { "name": "floors", "index": "6", "type": "numeric", "distinct": "6", "missing": "0", "min": "1", "max": "4", "mean": "1", "stdev": "1" }, { "name": "waterfront", "index": "7", "type": "numeric", "distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "view", "index": "8", "type": "numeric", "distinct": "5", "missing": "0", "min": "0", "max": "4", "mean": "0", "stdev": "1" }, { "name": "condition", "index": "9", "type": "numeric", "distinct": "5", "missing": "0", "min": "1", "max": "5", "mean": "3", "stdev": "1" }, { "name": "grade", "index": "10", "type": "numeric", "distinct": "12", "missing": "0", "min": "1", "max": "13", "mean": "8", "stdev": "1" }, { "name": "sqft_above", "index": "11", "type": "numeric", "distinct": "946", "missing": "0", "min": "290", "max": "9410", "mean": "1788", "stdev": "828" }, { "name": "sqft_basement", "index": "12", "type": "numeric", "distinct": "306", "missing": "0", "min": "0", "max": "4820", "mean": "292", "stdev": "443" }, { "name": "yr_built", "index": "13", "type": "numeric", "distinct": "116", "missing": "0", "min": "1900", "max": "2015", "mean": "1971", "stdev": "29" }, { "name": "yr_renovated", "index": "14", "type": "numeric", "distinct": "70", "missing": "0", "min": "0", "max": "2015", "mean": "84", "stdev": "402" }, { "name": "zipcode", "index": "15", "type": "nominal", "distinct": "70", "missing": "0", "distr": [] }, { "name": "lat", "index": "16", "type": "numeric", "distinct": "5034", "missing": "0", "min": "47", "max": "48", "mean": "48", "stdev": "0" }, { "name": "long", "index": "17", "type": "numeric", "distinct": "752", "missing": "0", "min": "-123", "max": "0", "mean": "-122", "stdev": "0" }, { "name": "sqft_living15", "index": "18", "type": "numeric", "distinct": "777", "missing": "0", "min": "399", "max": "6210", "mean": "1987", "stdev": "685" }, { "name": "sqft_lot15", "index": "19", "type": "numeric", "distinct": "8689", "missing": "0", "min": "651", "max": "871200", "mean": "12768", "stdev": "27304" }, { "name": "date_year", "index": "20", "type": "numeric", "distinct": "2", "missing": "0", "min": "2014", "max": "2015", "mean": "2014", "stdev": "0" }, { "name": "date_month", "index": "21", "type": "numeric", "distinct": "12", "missing": "0", "min": "1", "max": "12", "mean": "7", "stdev": "3" }, { "name": "date_day", "index": "22", "type": "numeric", "distinct": "31", "missing": "0", "min": "1", "max": "31", "mean": "16", "stdev": "9" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }