{ "data_id": "42092", "name": "house_sales", "exact_name": "house_sales", "version": 2, "version_label": "0.1", "description": "This dataset contains house sale prices for King County, which includes Seattle. It includes homes sold between May 2014 and May 2015.\n\nIt contains 19 house features plus the price and the id columns, along with 21613 observations.\nIt's a great dataset for evaluating simple regression models.", "format": "arff", "uploader": "Thomas Schmitt", "uploader_id": 3422, "visibility": "public", "creator": "https:\/\/www.kaggle.com\/harlfoxem\/", "contributor": "\"https:\/\/www.kaggle.com\/harlfoxem\/\"", "date": "2019-08-19 12:09:01", "update_comment": null, "last_update": "2019-08-19 12:09:01", "licence": "CC0 Public Domain", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/21578898\/dataset", "default_target_attribute": "price", "row_id_attribute": "id", "ignore_attribute": null, "runs": 0, "suggest": { "input": [ "house_sales", "This dataset contains house sale prices for King County, which includes Seattle. It includes homes sold between May 2014 and May 2015. It contains 19 house features plus the price and the id columns, along with 21613 observations. It's a great dataset for evaluating simple regression models. " ], "weight": 5 }, "qualities": { "NumberOfInstances": 21613, "NumberOfFeatures": 20, "NumberOfClasses": 0, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 18, "NumberOfSymbolicFeatures": 1, "MaxMutualInformation": null, "MinNominalAttDistinctValues": 70, "PercentageOfNumericFeatures": 90, "Quartile3MeansOfNumericAtts": 2009.889302734465, "MaxNominalAttDistinctValues": 70, "MinSkewnessOfNumericAtts": -0.48527047653794136, "PercentageOfSymbolicFeatures": 5, "Quartile3MutualInformation": null, "MaxSkewnessOfNumericAtts": 13.060018959032032, "MinStdDevOfNumericAtts": 0.0865171977279032, "Quartile1AttributeEntropy": null, "Quartile3SkewnessOfNumericAtts": 4.1554252002624565, "MaxStdDevOfNumericAtts": 367127.19648269983, "MinorityClassPercentage": null, "Quartile1KurtosisOfNumericAtts": 0.9185665567918385, "Quartile3StdDevOfNumericAtts": 850.6784575006379, "MeanAttributeEntropy": null, "MinorityClassSize": null, "Quartile1MeansOfNumericAtts": 1.9596452366631323, "StdvNominalAttDistinctValues": 0, "MeanKurtosisOfNumericAtts": 38.439028493829476, "NumberOfBinaryFeatures": 0, "Quartile1MutualInformation": null, "MeanMeansOfNumericAtts": 32006.053252985756, "Quartile1SkewnessOfNumericAtts": 0.7323715808576188, "AutoCorrelation": -324979.41569498426, "MeanMutualInformation": null, "Quartile1StdDevOfNumericAtts": 0.6230545085602959, "ClassEntropy": null, "MeanNoiseToSignalRatio": null, "Quartile2AttributeEntropy": null, "Dimensionality": 0.0009253689908851155, "MeanNominalAttDistinctValues": 70, "Quartile2KurtosisOfNumericAtts": 3.05893891640625, "EquivalentNumberOfAtts": null, "MeanSkewnessOfNumericAtts": 3.1311676256089784, "Quartile2MeansOfNumericAtts": 65.98115520982819, "MajorityClassPercentage": null, "MeanStdDevOfNumericAtts": 24397.924285785033, "Quartile2MutualInformation": null, "MajorityClassSize": null, "MinAttributeEntropy": null, "Quartile2SkewnessOfNumericAtts": 1.4591099500919529, "MaxAttributeEntropy": null, "MinKurtosisOfNumericAtts": -0.6763130016125789, "PercentageOfBinaryFeatures": 0, "Quartile2StdDevOfNumericAtts": 15.274434779682242, "MaxKurtosisOfNumericAtts": 285.07781969737005, "MinMeansOfNumericAtts": -122.21389640494147, "PercentageOfInstancesWithMissingValues": 0, "Quartile3AttributeEntropy": null, "MaxMeansOfNumericAtts": 540088.1417665279, "MinMutualInformation": null, "PercentageOfMissingValues": 0, "Quartile3KurtosisOfNumericAtts": 38.20506861937859 }, "tags": [ { "tag": "Computer Systems", "uploader": "38960" }, { "tag": "Education", "uploader": "38960" } ], "features": [ { "name": "price", "index": "2", "type": "numeric", "distinct": "4028", "missing": "0", "target": "1", "min": "75000", "max": "7700000", "mean": "540088", "stdev": "367127" }, { "name": "id", "index": "0", "type": "numeric", "distinct": "21436", "missing": "0", "identifier": "1", "min": "1000102", "max": "2147483647", "mean": "2147483647", "stdev": "2147483647" }, { "name": "date", "index": "1", "type": "string", "distinct": "372", "missing": "0" }, { "name": "bedrooms", "index": "3", "type": "numeric", "distinct": "13", "missing": "0", "min": "0", "max": "33", "mean": "3", "stdev": "1" }, { "name": "bathrooms", "index": "4", "type": "numeric", "distinct": "30", "missing": "0", "min": "0", "max": "8", "mean": "2", "stdev": "1" }, { "name": "sqft_living", "index": "5", "type": "numeric", "distinct": "1038", "missing": "0", "min": "290", "max": "13540", "mean": "2080", "stdev": "918" }, { "name": "sqft_lot", "index": "6", "type": "numeric", "distinct": "9782", "missing": "0", "min": "520", "max": "1651359", "mean": "15107", "stdev": "41421" }, { "name": "floors", "index": "7", "type": "numeric", "distinct": "6", "missing": "0", "min": "1", "max": "4", "mean": "1", "stdev": "1" }, { "name": "waterfront", "index": "8", "type": "numeric", "distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "view", "index": "9", "type": "numeric", "distinct": "5", "missing": "0", "min": "0", "max": "4", "mean": "0", "stdev": "1" }, { "name": "condition", "index": "10", "type": "numeric", "distinct": "5", "missing": "0", "min": "1", "max": "5", "mean": "3", "stdev": "1" }, { "name": "grade", "index": "11", "type": "numeric", "distinct": "12", "missing": "0", "min": "1", "max": "13", "mean": "8", "stdev": "1" }, { "name": "sqft_above", "index": "12", "type": "numeric", "distinct": "946", "missing": "0", "min": "290", "max": "9410", "mean": "1788", "stdev": "828" }, { "name": "sqft_basement", "index": "13", "type": "numeric", "distinct": "306", "missing": "0", "min": "0", "max": "4820", "mean": "292", "stdev": "443" }, { "name": "yr_built", "index": "14", "type": "numeric", "distinct": "116", "missing": "0", "min": "1900", "max": "2015", "mean": "1971", "stdev": "29" }, { "name": "yr_renovated", "index": "15", "type": "numeric", "distinct": "70", "missing": "0", "min": "0", "max": "2015", "mean": "84", "stdev": "402" }, { "name": "zipcode", "index": "16", "type": "nominal", "distinct": "70", "missing": "0", "distr": [] }, { "name": "lat", "index": "17", "type": "numeric", "distinct": "5034", "missing": "0", "min": "47", "max": "48", "mean": "48", "stdev": "0" }, { "name": "long", "index": "18", "type": "numeric", "distinct": "752", "missing": "0", "min": "-123", "max": "0", "mean": "-122", "stdev": "0" }, { "name": "sqft_living15", "index": "19", "type": "numeric", "distinct": "777", "missing": "0", "min": "399", "max": "6210", "mean": "1987", "stdev": "685" }, { "name": "sqft_lot15", "index": "20", "type": "numeric", "distinct": "8689", "missing": "0", "min": "651", "max": "871200", "mean": "12768", "stdev": "27304" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 4, "total_downloads": 14, "reach": 4, "reuse": 9, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 9 }