{ "data_id": "881", "name": "mv", "exact_name": "mv", "version": 2, "version_label": null, "description": "**Author**: \n**Source**: Unknown - Date unknown \n**Please cite**: \n\nBinarized version of the original data set (see version 1). It converts the numeric target feature to a two-class nominal target feature by computing the mean and classifying all instances with a lower target value as positive ('P') and all others as negative ('N').", "format": "ARFF", "uploader": "Joaquin Vanschoren", "uploader_id": 2, "visibility": "public", "creator": null, "contributor": null, "date": "2014-10-04 14:36:08", "update_comment": null, "last_update": "2014-10-04 14:36:08", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/53415\/mv.arff", "default_target_attribute": "binaryClass", "row_id_attribute": null, "ignore_attribute": null, "runs": 554, "suggest": { "input": [ "mv", "Binarized version of the original data set (see version 1). It converts the numeric target feature to a two-class nominal target feature by computing the mean and classifying all instances with a lower target value as positive ('P') and all others as negative ('N'). " ], "weight": 5 }, "qualities": { "NumberOfInstances": 40768, "NumberOfFeatures": 11, "NumberOfClasses": 2, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 7, "NumberOfSymbolicFeatures": 4, "REPTreeDepth3Kappa": 0.9912821419281953, "DecisionStumpKappa": 0.5972150781762856, "MaxMeansOfNumericAtts": 1100.2709723312403, "MinMutualInformation": 1.413943024e-5, "Quartile2SkewnessOfNumericAtts": -0.000785974385041192, "RandomTreeDepth1AUC": 0.9918256680030593, "Dimensionality": 0.00026981946624803766, "MaxMutualInformation": 0.2230909398455, "MinNominalAttDistinctValues": 2, "PercentageOfBinaryFeatures": 27.27272727272727, "Quartile2StdDevOfNumericAtts": 3.0234160845268416, "RandomTreeDepth1ErrRate": 0.007947409733124019, "EquivalentNumberOfAtts": 12.991015473633231, "MaxNominalAttDistinctValues": 3, "MinSkewnessOfNumericAtts": -0.32139705527027734, "PercentageOfInstancesWithMissingValues": 0, "Quartile3AttributeEntropy": 1.3204199058145483, "RandomTreeDepth1Kappa": 0.9834879689066137, "J48.00001.AUC": 0.9972892857377941, "MaxSkewnessOfNumericAtts": 0.9737649773688049, "MinStdDevOfNumericAtts": 0.5769759987326427, "PercentageOfMissingValues": 0, "Quartile3KurtosisOfNumericAtts": -0.9477199965281362, "AutoCorrelation": 0.5169867785218436, "RandomTreeDepth2AUC": 0.9918256680030593, "J48.00001.ErrRate": 0.0032623626373626375, "MaxStdDevOfNumericAtts": 115.27303730661535, "MinorityClassPercentage": 40.342916012558874, "PercentageOfNumericFeatures": 63.63636363636363, "Quartile3MeansOfNumericAtts": 299.22740423861853, "CfsSubsetEval_DecisionStumpAUC": 0.9970314105645728, "RandomTreeDepth2ErrRate": 0.007947409733124019, "J48.00001.Kappa": 0.9932219798789502, "MeanAttributeEntropy": 1.001707660080627, "MinorityClassSize": 16447, "PercentageOfSymbolicFeatures": 36.36363636363637, "Quartile3MutualInformation": 0.2230909398455, "CfsSubsetEval_DecisionStumpErrRate": 0.0032623626373626375, "RandomTreeDepth2Kappa": 0.9834879689066137, "J48.0001.AUC": 0.9972892857377941, "MeanKurtosisOfNumericAtts": -1.0763234053159079, "NaiveBayesAUC": 0.979651568371769, "Quartile1AttributeEntropy": 0.8070522790844934, "Quartile3SkewnessOfNumericAtts": 0.004869004163365361, "CfsSubsetEval_DecisionStumpKappa": 0.9932219798789502, "RandomTreeDepth3AUC": 0.9918256680030593, "J48.0001.ErrRate": 0.0032623626373626375, "MeanMeansOfNumericAtts": 195.93714543823938, "NaiveBayesErrRate": 0.09546703296703296, "Quartile1KurtosisOfNumericAtts": -1.2036877914266522, "Quartile3StdDevOfNumericAtts": 58.04571234111569, "CfsSubsetEval_NaiveBayesAUC": 0.9970314105645728, "RandomTreeDepth3ErrRate": 0.007947409733124019, "J48.0001.Kappa": 0.9932219798789502, "MeanMutualInformation": 0.07489185248075, "NaiveBayesKappa": 0.8050822196638202, "Quartile1MeansOfNumericAtts": -11.03942758810832, "REPTreeDepth1AUC": 0.9985919526051271, "CfsSubsetEval_NaiveBayesErrRate": 0.0032623626373626375, "RandomTreeDepth3Kappa": 0.9834879689066137, "J48.001.AUC": 0.9972892857377941, "MeanNoiseToSignalRatio": 12.375389002937311, "NumberOfBinaryFeatures": 3, "Quartile1MutualInformation": 1.413943024e-5, "REPTreeDepth1ErrRate": 0.004194466248037676, "CfsSubsetEval_NaiveBayesKappa": 0.9932219798789502, "CfsSubsetEval_kNN1NAUC": 0.9970314105645728, "StdvNominalAttDistinctValues": 0.5, "J48.001.ErrRate": 0.0032623626373626375, "MeanNominalAttDistinctValues": 2.25, "Quartile1SkewnessOfNumericAtts": -0.005807327596648444, "REPTreeDepth1Kappa": 0.9912821419281953, "CfsSubsetEval_kNN1NErrRate": 0.0032623626373626375, "kNN1NAUC": 0.9216630712714634, "J48.001.Kappa": 0.9932219798789502, "MeanSkewnessOfNumericAtts": 0.09261384330417145, "Quartile1StdDevOfNumericAtts": 1.4439636702716634, "REPTreeDepth2AUC": 0.9985919526051271, "CfsSubsetEval_kNN1NKappa": 0.9932219798789502, "kNN1NErrRate": 0.07604003139717426, "MajorityClassPercentage": 59.657083987441126, "MeanStdDevOfNumericAtts": 27.437454144768495, "Quartile2AttributeEntropy": 0.877650795342839, "REPTreeDepth2ErrRate": 0.004194466248037676, "ClassEntropy": 0.9729212144264806, "kNN1NKappa": 0.8422319268821838, "MajorityClassSize": 24321, "MinAttributeEntropy": 0.8070522790844934, "Quartile2KurtosisOfNumericAtts": -1.1981209273220916, "REPTreeDepth2Kappa": 0.9912821419281953, "REPTreeDepth3AUC": 0.9985919526051271, "DecisionStumpAUC": 0.8236443059377037, "MaxAttributeEntropy": 1.3204199058145483, "MinKurtosisOfNumericAtts": -1.2054637290423134, "Quartile2MeansOfNumericAtts": -0.0034792165178571775, "REPTreeDepth3ErrRate": 0.004194466248037676, "DecisionStumpErrRate": 0.20884026687598117, "MaxKurtosisOfNumericAtts": -0.5884095133947267, "MinMeansOfNumericAtts": -12.49774613912873, "Quartile2MutualInformation": 0.00157047816651 }, "tags": [ { "uploader": "2", "tag": "binarized_regression_problem" }, { "uploader": "38960", "tag": "Chemistry" }, { "uploader": "38960", "tag": "Life Science" }, { "uploader": "2", "tag": "study_1" }, { "uploader": "1", "tag": "study_41" }, { "uploader": "64", "tag": "study_7" } ], "features": [ { "name": "binaryClass", "index": "10", "type": "nominal", "distinct": "2", "missing": "0", "target": "1", "distr": [ [ "P", "N" ], [ [ "16447", "0" ], [ "0", "24321" ] ] ] }, { "name": "x1", "index": "0", "type": "numeric", "distinct": "40104", "missing": "0", "min": "-5", "max": "5", "mean": "0", "stdev": "3" }, { "name": "x2", "index": "1", "type": "numeric", "distinct": "27796", "missing": "0", "min": "-15", "max": "0", "mean": "-12", "stdev": "1" }, { "name": "x3", "index": "2", "type": "nominal", "distinct": "3", "missing": "0", "distr": [ [ "brown", "red", "green" ], [ [ "10174", "14379" ], [ "4603", "6738" ], [ "1670", "3204" ] ] ] }, { "name": "x4", "index": "3", "type": "numeric", "distinct": "39010", "missing": "0", "min": "-7", "max": "2", "mean": "-4", "stdev": "3" }, { "name": "x5", "index": "4", "type": "numeric", "distinct": "40390", "missing": "0", "min": "-1", "max": "1", "mean": "0", "stdev": "1" }, { "name": "x6", "index": "5", "type": "numeric", "distinct": "39832", "missing": "0", "min": "-37", "max": "12", "mean": "-11", "stdev": "11" }, { "name": "x7", "index": "6", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "no", "yes" ], [ [ "11521", "17137" ], [ "4926", "7184" ] ] ] }, { "name": "x8", "index": "7", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "normal", "large" ], [ [ "16447", "14237" ], [ "0", "10084" ] ] ] }, { "name": "x9", "index": "8", "type": "numeric", "distinct": "38738", "missing": "0", "min": "100", "max": "500", "mean": "299", "stdev": "115" }, { "name": "x10", "index": "9", "type": "numeric", "distinct": "201", "missing": "0", "min": "1000", "max": "1200", "mean": "1100", "stdev": "58" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }