{ "data_id": "853", "name": "boston", "exact_name": "boston", "version": 2, "version_label": null, "description": "**Author**: \n**Source**: Unknown - Date unknown \n**Please cite**: \n\nBinarized version of the original data set (see version 1). It converts the numeric target feature to a two-class nominal target feature by computing the mean and classifying all instances with a lower target value as positive ('P') and all others as negative ('N').", "format": "ARFF", "uploader": "Joaquin Vanschoren", "uploader_id": 2, "visibility": "public", "creator": null, "contributor": null, "date": "2014-10-04 14:35:22", "update_comment": null, "last_update": "2014-10-04 14:35:22", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/53387\/housing.arff", "default_target_attribute": "binaryClass", "row_id_attribute": null, "ignore_attribute": null, "runs": 734, "suggest": { "input": [ "boston", "Binarized version of the original data set (see version 1). It converts the numeric target feature to a two-class nominal target feature by computing the mean and classifying all instances with a lower target value as positive ('P') and all others as negative ('N'). " ], "weight": 5 }, "qualities": { "NumberOfInstances": 506, "NumberOfFeatures": 14, "NumberOfClasses": 2, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 12, "NumberOfSymbolicFeatures": 2, "REPTreeDepth3Kappa": 0.706664271600503, "DecisionStumpKappa": 0.6251119469819094, "MaxMeansOfNumericAtts": 408.23715415019797, "MinMutualInformation": 0.00544370659686, "Quartile2SkewnessOfNumericAtts": 0.6996319321649427, "RandomTreeDepth1AUC": 0.7869041290093921, "Dimensionality": 0.02766798418972332, "MaxMutualInformation": 0.00544370659686, "MinNominalAttDistinctValues": 2, "PercentageOfBinaryFeatures": 14.285714285714285, "Quartile2StdDevOfNumericAtts": 7.87130330834053, "RandomTreeDepth1ErrRate": 0.20355731225296442, "EquivalentNumberOfAtts": 179.67003797332868, "MaxNominalAttDistinctValues": 2, "MinSkewnessOfNumericAtts": -2.8903737121414426, "PercentageOfInstancesWithMissingValues": 0, "Quartile3AttributeEntropy": 0.3628184439419491, "RandomTreeDepth1Kappa": 0.5774924201890493, "J48.00001.AUC": 0.8541394809337393, "MaxSkewnessOfNumericAtts": 5.223148798243853, "MinStdDevOfNumericAtts": 0.11587767566755611, "PercentageOfMissingValues": 0, "Quartile3KurtosisOfNumericAtts": 3.496507654429232, "AutoCorrelation": 0.8, "RandomTreeDepth2AUC": 0.7869041290093921, "J48.00001.ErrRate": 0.1857707509881423, "MaxStdDevOfNumericAtts": 168.5371160549593, "MinorityClassPercentage": 41.30434782608695, "PercentageOfNumericFeatures": 85.71428571428571, "Quartile3MeansOfNumericAtts": 56.04505928853756, "CfsSubsetEval_DecisionStumpAUC": 0.9030415800750728, "RandomTreeDepth2ErrRate": 0.20355731225296442, "J48.00001.Kappa": 0.6113607765594103, "MeanAttributeEntropy": 0.3628184439419491, "MinorityClassSize": 209, "PercentageOfSymbolicFeatures": 14.285714285714285, "Quartile3MutualInformation": 0.00544370659686, "CfsSubsetEval_DecisionStumpErrRate": 0.16205533596837945, "RandomTreeDepth2Kappa": 0.5774924201890493, "J48.0001.AUC": 0.8541394809337393, "MeanKurtosisOfNumericAtts": 3.8917386725495886, "NaiveBayesAUC": 0.8540731144746122, "Quartile1AttributeEntropy": 0.3628184439419491, "Quartile3SkewnessOfNumericAtts": 1.0100390965302286, "CfsSubsetEval_DecisionStumpKappa": 0.6619465854095716, "RandomTreeDepth3AUC": 0.7869041290093921, "J48.0001.ErrRate": 0.1857707509881423, "MeanMeansOfNumericAtts": 75.90770013504614, "NaiveBayesErrRate": 0.2450592885375494, "Quartile1KurtosisOfNumericAtts": -0.9425946940228838, "Quartile3StdDevOfNumericAtts": 26.942259303806473, "CfsSubsetEval_NaiveBayesAUC": 0.9030415800750728, "RandomTreeDepth3ErrRate": 0.20355731225296442, "J48.0001.Kappa": 0.6113607765594103, "MeanMutualInformation": 0.00544370659686, "NaiveBayesKappa": 0.519784475500926, "Quartile1MeansOfNumericAtts": 4.417440612648221, "REPTreeDepth1AUC": 0.8852963446264882, "CfsSubsetEval_NaiveBayesErrRate": 0.16205533596837945, "RandomTreeDepth3Kappa": 0.5774924201890493, "J48.001.AUC": 0.8541394809337393, "MeanNoiseToSignalRatio": 65.64915485181135, "NumberOfBinaryFeatures": 2, "Quartile1MutualInformation": 0.00544370659686, "REPTreeDepth1ErrRate": 0.14031620553359683, "CfsSubsetEval_NaiveBayesKappa": 0.6619465854095716, "CfsSubsetEval_kNN1NAUC": 0.9030415800750728, "StdvNominalAttDistinctValues": 0, "J48.001.ErrRate": 0.1857707509881423, "MeanNominalAttDistinctValues": 2, "Quartile1SkewnessOfNumericAtts": -0.375466587942593, "REPTreeDepth1Kappa": 0.706664271600503, "CfsSubsetEval_kNN1NErrRate": 0.16205533596837945, "kNN1NAUC": 0.8082580187843346, "J48.001.Kappa": 0.6113607765594103, "MeanSkewnessOfNumericAtts": 0.6815088940587999, "Quartile1StdDevOfNumericAtts": 2.1205189758993193, "REPTreeDepth2AUC": 0.8852963446264882, "CfsSubsetEval_kNN1NKappa": 0.6619465854095716, "kNN1NErrRate": 0.18181818181818182, "MajorityClassPercentage": 58.69565217391305, "MeanStdDevOfNumericAtts": 28.975222020981562, "Quartile2AttributeEntropy": 0.3628184439419491, "REPTreeDepth2ErrRate": 0.14031620553359683, "ClassEntropy": 0.978070970973496, "kNN1NKappa": 0.6218051831992852, "MajorityClassSize": 297, "MinAttributeEntropy": 0.3628184439419491, "Quartile2KurtosisOfNumericAtts": 0.2116369944394767, "REPTreeDepth2Kappa": 0.706664271600503, "REPTreeDepth3AUC": 0.8852963446264882, "DecisionStumpAUC": 0.8453675511091779, "MaxAttributeEntropy": 0.3628184439419491, "MinKurtosisOfNumericAtts": -1.2335396011495194, "Quartile2MeansOfNumericAtts": 11.250207509881431, "REPTreeDepth3ErrRate": 0.14031620553359683, "DecisionStumpErrRate": 0.17984189723320157, "MaxKurtosisOfNumericAtts": 37.130509129522004, "MinMeansOfNumericAtts": 0.5546950592885375, "Quartile2MutualInformation": 0.00544370659686 }, "tags": [ { "uploader": "2", "tag": "binarized_regression_problem" }, { "uploader": "38960", "tag": "Chemistry" }, { "uploader": "38960", "tag": "Life Science" }, { "uploader": "1", "tag": "mythbusting_1" }, { "uploader": "2", "tag": "study_1" }, { "uploader": "939", "tag": "study_15" }, { "uploader": "939", "tag": "study_20" }, { "uploader": "1", "tag": "study_41" }, { "uploader": "64", "tag": "study_7" } ], "features": [ { "name": "binaryClass", "index": "13", "type": "nominal", "distinct": "2", "missing": "0", "target": "1", "distr": [ [ "P", "N" ], [ [ "297", "0" ], [ "0", "209" ] ] ] }, { "name": "CRIM", "index": "0", "type": "numeric", "distinct": "504", "missing": "0", "min": "0", "max": "89", "mean": "4", "stdev": "9" }, { "name": "ZN", "index": "1", "type": "numeric", "distinct": "26", "missing": "0", "min": "0", "max": "100", "mean": "11", "stdev": "23" }, { "name": "INDUS", "index": "2", "type": "numeric", "distinct": "76", "missing": "0", "min": "0", "max": "28", "mean": "11", "stdev": "7" }, { "name": "CHAS", "index": "3", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "0", "1" ], [ [ "282", "189" ], [ "15", "20" ] ] ] }, { "name": "NOX", "index": "4", "type": "numeric", "distinct": "81", "missing": "0", "min": "0", "max": "1", "mean": "1", "stdev": "0" }, { "name": "RM", "index": "5", "type": "numeric", "distinct": "446", "missing": "0", "min": "4", "max": "9", "mean": "6", "stdev": "1" }, { "name": "AGE", "index": "6", "type": "numeric", "distinct": "356", "missing": "0", "min": "3", "max": "100", "mean": "69", "stdev": "28" }, { "name": "DIS", "index": "7", "type": "numeric", "distinct": "412", "missing": "0", "min": "1", "max": "12", "mean": "4", "stdev": "2" }, { "name": "RAD", "index": "8", "type": "numeric", "distinct": "9", "missing": "0", "min": "1", "max": "24", "mean": "10", "stdev": "9" }, { "name": "TAX", "index": "9", "type": "numeric", "distinct": "66", "missing": "0", "min": "187", "max": "711", "mean": "408", "stdev": "169" }, { "name": "PTRATIO", "index": "10", "type": "numeric", "distinct": "46", "missing": "0", "min": "13", "max": "22", "mean": "18", "stdev": "2" }, { "name": "B", "index": "11", "type": "numeric", "distinct": "357", "missing": "0", "min": "0", "max": "397", "mean": "357", "stdev": "91" }, { "name": "LSTAT", "index": "12", "type": "numeric", "distinct": "455", "missing": "0", "min": "2", "max": "38", "mean": "13", "stdev": "7" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }