{ "data_id": "939", "name": "chscase_whale", "exact_name": "chscase_whale", "version": 2, "version_label": null, "description": "**Author**: \n**Source**: Unknown - Date unknown \n**Please cite**: \n\nBinarized version of the original data set (see version 1). It converts the numeric target feature to a two-class nominal target feature by computing the mean and classifying all instances with a lower target value as positive ('P') and all others as negative ('N').", "format": "ARFF", "uploader": "Joaquin Vanschoren", "uploader_id": 2, "visibility": "public", "creator": null, "contributor": null, "date": "2014-10-04 14:37:40", "update_comment": "col_1 is a row id", "last_update": "2015-04-15 17:34:14", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/53473\/chscase_whale.arff", "default_target_attribute": "binaryClass", "row_id_attribute": "col_1", "ignore_attribute": null, "runs": 118, "suggest": { "input": [ "chscase_whale", "Binarized version of the original data set (see version 1). It converts the numeric target feature to a two-class nominal target feature by computing the mean and classifying all instances with a lower target value as positive ('P') and all others as negative ('N'). " ], "weight": 5 }, "qualities": { "NumberOfInstances": 228, "NumberOfFeatures": 9, "NumberOfClasses": 2, "NumberOfMissingValues": 20, "NumberOfInstancesWithMissingValues": 5, "NumberOfNumericFeatures": 8, "NumberOfSymbolicFeatures": 1, "REPTreeDepth3Kappa": 0.9736842105263157, "DecisionStumpKappa": 0.9736842105263157, "MaxMeansOfNumericAtts": 331.19282511210736, "MinMutualInformation": null, "Quartile2SkewnessOfNumericAtts": 0.24998368566466883, "RandomTreeDepth1AUC": 0.9584199584199584, "Dimensionality": 0.039473684210526314, "MaxMutualInformation": null, "MinNominalAttDistinctValues": 2, "PercentageOfBinaryFeatures": 11.11111111111111, "Quartile2StdDevOfNumericAtts": 10.096190797680036, "RandomTreeDepth1ErrRate": 0.05263157894736842, "EquivalentNumberOfAtts": null, "MaxNominalAttDistinctValues": 2, "MinSkewnessOfNumericAtts": -0.10496357019603114, "PercentageOfInstancesWithMissingValues": 2.1929824561403506, "Quartile3AttributeEntropy": null, "RandomTreeDepth1Kappa": 0.8946152068407671, "J48.00001.AUC": 0.984984984984985, "MaxSkewnessOfNumericAtts": 1.1576198625962384, "MinStdDevOfNumericAtts": 0.5011001113409407, "PercentageOfMissingValues": 0.9746588693957114, "Quartile3KurtosisOfNumericAtts": 1.665286521567358, "AutoCorrelation": 0.5110132158590308, "RandomTreeDepth2AUC": 0.9584199584199584, "J48.00001.ErrRate": 0.013157894736842105, "MaxStdDevOfNumericAtts": 197.19831227143783, "MinorityClassPercentage": 48.68421052631579, "PercentageOfNumericFeatures": 88.88888888888889, "Quartile3MeansOfNumericAtts": 130.74671052631575, "CfsSubsetEval_DecisionStumpAUC": 0.984984984984985, "RandomTreeDepth2ErrRate": 0.05263157894736842, "J48.00001.Kappa": 0.9736842105263157, "MeanAttributeEntropy": null, "MinorityClassSize": 111, "PercentageOfSymbolicFeatures": 11.11111111111111, "Quartile3MutualInformation": null, "CfsSubsetEval_DecisionStumpErrRate": 0.013157894736842105, "RandomTreeDepth2Kappa": 0.8946152068407671, "J48.0001.AUC": 0.984984984984985, "MeanKurtosisOfNumericAtts": 0.4028994077746712, "NaiveBayesAUC": 0.9792869792869793, "Quartile1AttributeEntropy": null, "Quartile3SkewnessOfNumericAtts": 0.8957261397892282, "CfsSubsetEval_DecisionStumpKappa": 0.9736842105263157, "RandomTreeDepth3AUC": 0.9584199584199584, "J48.0001.ErrRate": 0.013157894736842105, "MeanMeansOfNumericAtts": 80.3989925064904, "NaiveBayesErrRate": 0.021929824561403508, "Quartile1KurtosisOfNumericAtts": -0.8881483411265974, "Quartile3StdDevOfNumericAtts": 76.95794847899725, "CfsSubsetEval_NaiveBayesAUC": 0.984984984984985, "RandomTreeDepth3ErrRate": 0.05263157894736842, "J48.0001.Kappa": 0.9736842105263157, "MeanMutualInformation": null, "NaiveBayesKappa": 0.9561605906783571, "Quartile1MeansOfNumericAtts": 9.264441232003776, "REPTreeDepth1AUC": 0.984984984984985, "CfsSubsetEval_NaiveBayesErrRate": 0.013157894736842105, "RandomTreeDepth3Kappa": 0.8946152068407671, "J48.001.AUC": 0.984984984984985, "MeanNoiseToSignalRatio": null, "NumberOfBinaryFeatures": 1, "Quartile1MutualInformation": null, "REPTreeDepth1ErrRate": 0.013157894736842105, "CfsSubsetEval_NaiveBayesKappa": 0.9736842105263157, "CfsSubsetEval_kNN1NAUC": 0.984984984984985, "StdvNominalAttDistinctValues": 0, "J48.001.ErrRate": 0.013157894736842105, "MeanNominalAttDistinctValues": 2, "Quartile1SkewnessOfNumericAtts": -0.030880859209178695, "REPTreeDepth1Kappa": 0.9736842105263157, "CfsSubsetEval_kNN1NErrRate": 0.013157894736842105, "kNN1NAUC": 0.9871794871794872, "J48.001.Kappa": 0.9736842105263157, "MeanSkewnessOfNumericAtts": 0.4059507391437395, "Quartile1StdDevOfNumericAtts": 3.318023287882183, "REPTreeDepth2AUC": 0.984984984984985, "CfsSubsetEval_kNN1NKappa": 0.9736842105263157, "kNN1NErrRate": 0.013157894736842105, "MajorityClassPercentage": 51.31578947368421, "MeanStdDevOfNumericAtts": 46.28345209300907, "Quartile2AttributeEntropy": null, "REPTreeDepth2ErrRate": 0.013157894736842105, "ClassEntropy": 0.9995003941817588, "kNN1NKappa": 0.9736842105263157, "MajorityClassSize": 117, "MinAttributeEntropy": null, "Quartile2KurtosisOfNumericAtts": 0.45674753888344144, "REPTreeDepth2Kappa": 0.9736842105263157, "REPTreeDepth3AUC": 0.984984984984985, "DecisionStumpAUC": 0.984984984984985, "MaxAttributeEntropy": null, "MinKurtosisOfNumericAtts": -2.0177777777777783, "Quartile2MeansOfNumericAtts": 21.464096058531982, "REPTreeDepth3ErrRate": 0.013157894736842105, "DecisionStumpErrRate": 0.013157894736842105, "MaxKurtosisOfNumericAtts": 2.5190542688020283, "MinMeansOfNumericAtts": 0.5, "Quartile2MutualInformation": null }, "tags": [ { "uploader": "38960", "tag": "Chemistry" }, { "uploader": "38960", "tag": "Life Science" }, { "uploader": "1", "tag": "mythbusting_1" }, { "uploader": "2", "tag": "study_1" }, { "uploader": "939", "tag": "study_15" }, { "uploader": "939", "tag": "study_20" } ], "features": [ { "name": "binaryClass", "index": "9", "type": "nominal", "distinct": "2", "missing": "0", "target": "1", "distr": [ [ "P", "N" ], [ [ "111", "0" ], [ "0", "117" ] ] ] }, { "name": "col_1", "index": "0", "type": "numeric", "distinct": "228", "missing": "0", "identifier": "1", "min": "1", "max": "228", "mean": "115", "stdev": "66" }, { "name": "col_2", "index": "1", "type": "numeric", "distinct": "19", "missing": "0", "min": "0", "max": "18", "mean": "9", "stdev": "3" }, { "name": "col_3", "index": "2", "type": "numeric", "distinct": "156", "missing": "0", "min": "0", "max": "482", "mean": "137", "stdev": "81" }, { "name": "col_4", "index": "3", "type": "numeric", "distinct": "34", "missing": "0", "min": "0", "max": "49", "mean": "16", "stdev": "9" }, { "name": "col_6", "index": "4", "type": "numeric", "distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "1", "stdev": "1" }, { "name": "col_7", "index": "5", "type": "numeric", "distinct": "223", "missing": "5", "min": "1", "max": "223", "mean": "112", "stdev": "65" }, { "name": "col_8", "index": "6", "type": "numeric", "distinct": "18", "missing": "5", "min": "0", "max": "24", "mean": "11", "stdev": "3" }, { "name": "col_9", "index": "7", "type": "numeric", "distinct": "183", "missing": "5", "min": "0", "max": "954", "mean": "331", "stdev": "197" }, { "name": "col_10", "index": "8", "type": "numeric", "distinct": "38", "missing": "5", "min": "0", "max": "66", "mean": "27", "stdev": "11" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }