{ "data_id": "854", "name": "fishcatch", "exact_name": "fishcatch", "version": 2, "version_label": null, "description": "**Author**: \n**Source**: Unknown - Date unknown \n**Please cite**: \n\nBinarized version of the original data set (see version 1). It converts the numeric target feature to a two-class nominal target feature by computing the mean and classifying all instances with a lower target value as positive ('P') and all others as negative ('N').", "format": "ARFF", "uploader": "Joaquin Vanschoren", "uploader_id": 2, "visibility": "public", "creator": null, "contributor": null, "date": "2014-10-04 14:35:24", "update_comment": null, "last_update": "2014-10-04 14:35:24", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/53388\/fishcatch.arff", "default_target_attribute": "binaryClass", "row_id_attribute": null, "ignore_attribute": null, "runs": 672, "suggest": { "input": [ "fishcatch", "Binarized version of the original data set (see version 1). It converts the numeric target feature to a two-class nominal target feature by computing the mean and classifying all instances with a lower target value as positive ('P') and all others as negative ('N'). " ], "weight": 5 }, "qualities": { "NumberOfInstances": 158, "NumberOfFeatures": 8, "NumberOfClasses": 2, "NumberOfMissingValues": 87, "NumberOfInstancesWithMissingValues": 87, "NumberOfNumericFeatures": 5, "NumberOfSymbolicFeatures": 3, "REPTreeDepth3Kappa": 0.8839941262848753, "DecisionStumpKappa": 0.8582150432370695, "MaxMeansOfNumericAtts": 31.18860759493671, "MinMutualInformation": 2.57391454e-6, "Quartile2SkewnessOfNumericAtts": 0.40047286122025627, "RandomTreeDepth1AUC": 0.9076023391812865, "Dimensionality": 0.05063291139240506, "MaxMutualInformation": 0.3810166886138, "MinNominalAttDistinctValues": 2, "PercentageOfBinaryFeatures": 25, "Quartile2StdDevOfNumericAtts": 10.024844409876481, "RandomTreeDepth1ErrRate": 0.08860759493670886, "EquivalentNumberOfAtts": 5.092683826728161, "MaxNominalAttDistinctValues": 7, "MinSkewnessOfNumericAtts": -0.47418381274078825, "PercentageOfInstancesWithMissingValues": 55.06329113924051, "Quartile3AttributeEntropy": 2.4874672408677103, "RandomTreeDepth1Kappa": 0.815204678362573, "J48.00001.AUC": 0.9369256474519633, "MaxSkewnessOfNumericAtts": 0.5932779186002889, "MinStdDevOfNumericAtts": 2.2812293830708743, "PercentageOfMissingValues": 6.882911392405064, "Quartile3KurtosisOfNumericAtts": 0.4097586355440106, "AutoCorrelation": 0.9299363057324841, "RandomTreeDepth2AUC": 0.9076023391812865, "J48.00001.ErrRate": 0.06329113924050633, "MaxStdDevOfNumericAtts": 11.637009786666583, "MinorityClassPercentage": 39.87341772151899, "PercentageOfNumericFeatures": 62.5, "Quartile3MeansOfNumericAtts": 29.790822784810125, "CfsSubsetEval_DecisionStumpAUC": 0.9372598162071847, "RandomTreeDepth2ErrRate": 0.08860759493670886, "J48.00001.Kappa": 0.8707672174055292, "MeanAttributeEntropy": 1.7099140624220022, "MinorityClassSize": 63, "PercentageOfSymbolicFeatures": 37.5, "Quartile3MutualInformation": 0.3810166886138, "CfsSubsetEval_DecisionStumpErrRate": 0.06329113924050633, "RandomTreeDepth2Kappa": 0.815204678362573, "J48.0001.AUC": 0.9369256474519633, "MeanKurtosisOfNumericAtts": 0.03493850871997922, "NaiveBayesAUC": 0.98796992481203, "Quartile1AttributeEntropy": 0.9323608839762941, "Quartile3SkewnessOfNumericAtts": 0.5691118008672688, "CfsSubsetEval_DecisionStumpKappa": 0.871440195280716, "RandomTreeDepth3AUC": 0.9076023391812865, "J48.0001.ErrRate": 0.06329113924050633, "MeanMeansOfNumericAtts": 25.636835443037974, "NaiveBayesErrRate": 0.0379746835443038, "Quartile1KurtosisOfNumericAtts": -0.458886687340194, "Quartile3StdDevOfNumericAtts": 11.191790776400175, "CfsSubsetEval_NaiveBayesAUC": 0.9372598162071847, "RandomTreeDepth3ErrRate": 0.08860759493670886, "J48.0001.Kappa": 0.8707672174055292, "MeanMutualInformation": 0.19050963126417, "NaiveBayesKappa": 0.9220522940305871, "Quartile1MeansOfNumericAtts": 20.173101265822787, "REPTreeDepth1AUC": 0.9655806182121972, "CfsSubsetEval_NaiveBayesErrRate": 0.06329113924050633, "RandomTreeDepth3Kappa": 0.815204678362573, "J48.001.AUC": 0.9369256474519633, "MeanNoiseToSignalRatio": 7.975473056535138, "NumberOfBinaryFeatures": 2, "Quartile1MutualInformation": 2.57391454e-6, "REPTreeDepth1ErrRate": 0.056962025316455694, "CfsSubsetEval_NaiveBayesKappa": 0.871440195280716, "CfsSubsetEval_kNN1NAUC": 0.9372598162071847, "StdvNominalAttDistinctValues": 2.886751345948129, "J48.001.ErrRate": 0.06329113924050633, "MeanNominalAttDistinctValues": 3.6666666666666665, "Quartile1SkewnessOfNumericAtts": -0.16998286040798916, "REPTreeDepth1Kappa": 0.8839941262848753, "CfsSubsetEval_kNN1NErrRate": 0.06329113924050633, "kNN1NAUC": 0.9208020050125313, "J48.001.Kappa": 0.8707672174055292, "MeanSkewnessOfNumericAtts": 0.23974614842776312, "Quartile1StdDevOfNumericAtts": 5.288802975165147, "REPTreeDepth2AUC": 0.9655806182121972, "CfsSubsetEval_kNN1NKappa": 0.871440195280716, "kNN1NErrRate": 0.0759493670886076, "MajorityClassPercentage": 60.12658227848101, "MeanStdDevOfNumericAtts": 8.597206382601424, "Quartile2AttributeEntropy": 1.7099140624220022, "REPTreeDepth2ErrRate": 0.056962025316455694, "ClassEntropy": 0.9702053179749841, "kNN1NKappa": 0.8416040100250628, "MajorityClassSize": 95, "MinAttributeEntropy": 0.9323608839762941, "Quartile2KurtosisOfNumericAtts": 0.27294864719226286, "REPTreeDepth2Kappa": 0.8839941262848753, "REPTreeDepth3AUC": 0.9655806182121972, "DecisionStumpAUC": 0.9290726817042606, "MaxAttributeEntropy": 2.4874672408677103, "MinKurtosisOfNumericAtts": -0.9894962095686894, "Quartile2MeansOfNumericAtts": 28.25632911392405, "REPTreeDepth3ErrRate": 0.056962025316455694, "DecisionStumpErrRate": 0.06962025316455696, "MaxKurtosisOfNumericAtts": 0.4276975419429512, "MinMeansOfNumericAtts": 14.119620253164557, "Quartile2MutualInformation": 0.19050963126417 }, "tags": [ { "uploader": "1", "tag": "binarized" }, { "uploader": "38960", "tag": "Chemistry" }, { "uploader": "38960", "tag": "Life Science" }, { "uploader": "2", "tag": "study_1" }, { "uploader": "3886", "tag": "study_123" }, { "uploader": "1", "tag": "study_41" } ], "features": [ { "name": "binaryClass", "index": "7", "type": "nominal", "distinct": "2", "missing": "0", "target": "1", "distr": [ [ "P", "N" ], [ [ "95", "0" ], [ "0", "63" ] ] ] }, { "name": "Species", "index": "0", "type": "nominal", "distinct": "7", "missing": "0", "distr": [ [ "1", "2", "3", "4", "5", "6", "7" ], [ [ "5", "29" ], [ "3", "3" ], [ "20", "0" ], [ "11", "0" ], [ "14", "0" ], [ "5", "12" ], [ "37", "19" ] ] ] }, { "name": "Length1", "index": "1", "type": "numeric", "distinct": "116", "missing": "0", "min": "8", "max": "59", "mean": "26", "stdev": "10" }, { "name": "Length2", "index": "2", "type": "numeric", "distinct": "93", "missing": "0", "min": "8", "max": "63", "mean": "28", "stdev": "11" }, { "name": "Length3", "index": "3", "type": "numeric", "distinct": "124", "missing": "0", "min": "9", "max": "68", "mean": "31", "stdev": "12" }, { "name": "Height", "index": "4", "type": "numeric", "distinct": "108", "missing": "0", "min": "15", "max": "45", "mean": "28", "stdev": "8" }, { "name": "Width", "index": "5", "type": "numeric", "distinct": "66", "missing": "0", "min": "9", "max": "21", "mean": "14", "stdev": "2" }, { "name": "Sex", "index": "6", "type": "nominal", "distinct": "2", "missing": "87", "distr": [ [ "1", "0" ], [ [ "10", "6" ], [ "33", "22" ] ] ] } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }