{ "data_id": "947", "name": "arsenic-male-bladder", "exact_name": "arsenic-male-bladder", "version": 2, "version_label": null, "description": "**Author**: \n**Source**: Unknown - Date unknown \n**Please cite**: \n\nBinarized version of the original data set (see version 1). It converts the numeric target feature to a two-class nominal target feature by computing the mean and classifying all instances with a lower target value as positive ('P') and all others as negative ('N'). Originally converted by Quan Sun.", "format": "ARFF", "uploader": "Joaquin Vanschoren", "uploader_id": 2, "visibility": "public", "creator": null, "contributor": null, "date": "2014-10-04 22:16:45", "update_comment": null, "last_update": "2014-10-04 22:16:45", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/53481\/arsenic-male-bladder.arff", "default_target_attribute": "binaryClass", "row_id_attribute": null, "ignore_attribute": null, "runs": 774, "suggest": { "input": [ "arsenic-male-bladder", "Binarized version of the original data set (see version 1). It converts the numeric target feature to a two-class nominal target feature by computing the mean and classifying all instances with a lower target value as positive ('P') and all others as negative ('N'). Originally converted by Quan Sun. " ], "weight": 5 }, "qualities": { "NumberOfInstances": 559, "NumberOfFeatures": 5, "NumberOfClasses": 2, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 3, "NumberOfSymbolicFeatures": 2, "REPTreeDepth3Kappa": 0.6934543097861304, "DecisionStumpKappa": 0.6934543097861304, "MaxMeansOfNumericAtts": 26738.4203935598, "MinMutualInformation": 0.16846478968512, "Quartile2SkewnessOfNumericAtts": 0.44144296843342257, "RandomTreeDepth1AUC": 0.8554517133956386, "Dimensionality": 0.008944543828264758, "MaxMutualInformation": 0.16846478968512, "MinNominalAttDistinctValues": 2, "PercentageOfBinaryFeatures": 20, "Quartile2StdDevOfNumericAtts": 259.75418695902493, "RandomTreeDepth1ErrRate": 0.01967799642218247, "EquivalentNumberOfAtts": 1.5171453169929718, "MaxNominalAttDistinctValues": 43, "MinSkewnessOfNumericAtts": 0, "PercentageOfInstancesWithMissingValues": 0, "Quartile3AttributeEntropy": 5.426264754702098, "RandomTreeDepth1Kappa": 0.6934543097861304, "J48.00001.AUC": 0.4995327102803739, "MaxSkewnessOfNumericAtts": 9.625987907165195, "MinStdDevOfNumericAtts": 18.72504312794417, "PercentageOfMissingValues": 0, "Quartile3KurtosisOfNumericAtts": 105.02116494074556, "AutoCorrelation": 0.9623655913978495, "RandomTreeDepth2AUC": 0.8031931464174454, "J48.00001.ErrRate": 0.04293381037567084, "MaxStdDevOfNumericAtts": 208422.13589209947, "MinorityClassPercentage": 4.293381037567084, "PercentageOfNumericFeatures": 60, "Quartile3MeansOfNumericAtts": 26738.4203935598, "CfsSubsetEval_DecisionStumpAUC": 0.760202492211838, "RandomTreeDepth2ErrRate": 0.025044722719141325, "J48.00001.Kappa": 0, "MeanAttributeEntropy": 5.426264754702098, "MinorityClassSize": 24, "PercentageOfSymbolicFeatures": 40, "Quartile3MutualInformation": 0.16846478968512, "CfsSubsetEval_DecisionStumpErrRate": 0.01967799642218247, "RandomTreeDepth2Kappa": 0.6375509447943678, "J48.0001.AUC": 0.4995327102803739, "MeanKurtosisOfNumericAtts": 34.250533768824674, "NaiveBayesAUC": 0.87297507788162, "Quartile1AttributeEntropy": 5.426264754702098, "Quartile3SkewnessOfNumericAtts": 9.625987907165195, "CfsSubsetEval_DecisionStumpKappa": 0.6934543097861304, "RandomTreeDepth3AUC": 0.7633566978193146, "J48.0001.ErrRate": 0.04293381037567084, "MeanMeansOfNumericAtts": 9034.43082886102, "NaiveBayesErrRate": 0.01967799642218247, "Quartile1KurtosisOfNumericAtts": -1.214406571690584, "Quartile3StdDevOfNumericAtts": 208422.13589209947, "CfsSubsetEval_NaiveBayesAUC": 0.8394080996884735, "RandomTreeDepth3ErrRate": 0.03398926654740608, "J48.0001.Kappa": 0, "MeanMutualInformation": 0.16846478968512, "NaiveBayesKappa": 0.6934543097861304, "Quartile1MeansOfNumericAtts": 52.5, "REPTreeDepth1AUC": 0.8554517133956386, "CfsSubsetEval_NaiveBayesErrRate": 0.01967799642218247, "RandomTreeDepth3Kappa": 0.5601523998840436, "J48.001.AUC": 0.4995327102803739, "MeanNoiseToSignalRatio": 31.210082384837857, "NumberOfBinaryFeatures": 1, "Quartile1MutualInformation": 0.16846478968512, "REPTreeDepth1ErrRate": 0.01967799642218247, "CfsSubsetEval_NaiveBayesKappa": 0.6934543097861304, "CfsSubsetEval_kNN1NAUC": 0.8658099688473521, "StdvNominalAttDistinctValues": 28.991378028648448, "J48.001.ErrRate": 0.04293381037567084, "MeanNominalAttDistinctValues": 22.5, "Quartile1SkewnessOfNumericAtts": 0, "REPTreeDepth1Kappa": 0.6934543097861304, "CfsSubsetEval_kNN1NErrRate": 0.01967799642218247, "kNN1NAUC": 0.7513239875389408, "J48.001.Kappa": 0, "MeanSkewnessOfNumericAtts": 3.355810291866206, "Quartile1StdDevOfNumericAtts": 18.72504312794417, "REPTreeDepth2AUC": 0.8554517133956386, "CfsSubsetEval_kNN1NKappa": 0.6934543097861304, "kNN1NErrRate": 0.03577817531305903, "MajorityClassPercentage": 95.70661896243293, "MeanStdDevOfNumericAtts": 69566.87170739548, "Quartile2AttributeEntropy": 5.426264754702098, "REPTreeDepth2ErrRate": 0.01967799642218247, "ClassEntropy": 0.2555855667489857, "kNN1NKappa": 0.5465974531592179, "MajorityClassSize": 535, "MinAttributeEntropy": 5.426264754702098, "Quartile2KurtosisOfNumericAtts": -1.0551570625809767, "REPTreeDepth2Kappa": 0.6934543097861304, "REPTreeDepth3AUC": 0.8554517133956386, "DecisionStumpAUC": 0.760202492211838, "MaxAttributeEntropy": 5.426264754702098, "MinKurtosisOfNumericAtts": -1.214406571690584, "Quartile2MeansOfNumericAtts": 312.37209302325346, "REPTreeDepth3ErrRate": 0.01967799642218247, "DecisionStumpErrRate": 0.01967799642218247, "MaxKurtosisOfNumericAtts": 105.02116494074556, "MinMeansOfNumericAtts": 52.5, "Quartile2MutualInformation": 0.16846478968512 }, "tags": [ { "uploader": "38960", "tag": "Chemistry" }, { "uploader": "38960", "tag": "Life Science" }, { "uploader": "1", "tag": "mythbusting_1" }, { "uploader": "2", "tag": "study_1" }, { "uploader": "939", "tag": "study_15" }, { "uploader": "939", "tag": "study_20" }, { "uploader": "1", "tag": "study_41" }, { "uploader": "64", "tag": "study_7" } ], "features": [ { "name": "binaryClass", "index": "4", "type": "nominal", "distinct": "2", "missing": "0", "target": "1", "distr": [ [ "P", "N" ], [ [ "535", "0" ], [ "0", "24" ] ] ] }, { "name": "group", "index": "0", "type": "nominal", "distinct": "43", "missing": "0", "distr": [ [ "1", "2", "3", "4", "5", "6", "7", "8", "9", "10", "11", "12", "13", "14", "15", "16", "17", "18", "19", "20", "21", "22", "23", "24", "25", "26", "27", "28", "29", "30", "31", "32", "33", "34", "35", "36", "37", "38", "39", "40", "41", "42", "43" ], [ [ "0", "13" ], [ "13", "0" ], [ "13", "0" ], [ "12", "1" ], [ "12", "1" ], [ "12", "1" ], [ "13", "0" ], [ "13", "0" ], [ "13", "0" ], [ "13", "0" ], [ "13", "0" ], [ "13", "0" ], [ "13", "0" ], [ "13", "0" ], [ "13", "0" ], [ "11", "2" ], [ "13", "0" ], [ "13", "0" ], [ "13", "0" ], [ "13", "0" ], [ "13", "0" ], [ "13", "0" ], [ "13", "0" ], [ "12", "1" ], [ "13", "0" ], [ "13", "0" ], [ "13", "0" ], [ "13", "0" ], [ "12", "1" ], [ "13", "0" ], [ "13", "0" ], [ "13", "0" ], [ "13", "0" ], [ "13", "0" ], [ "13", "0" ], [ "13", "0" ], [ "13", "0" ], [ "13", "0" ], [ "10", "3" ], [ "13", "0" ], [ "13", "0" ], [ "13", "0" ], [ "12", "1" ] ] ] }, { "name": "conc", "index": "1", "type": "numeric", "distinct": "38", "missing": "0", "min": "0", "max": "934", "mean": "312", "stdev": "260" }, { "name": "age", "index": "2", "type": "numeric", "distinct": "13", "missing": "0", "min": "23", "max": "83", "mean": "53", "stdev": "19" }, { "name": "at.risk", "index": "3", "type": "numeric", "distinct": "425", "missing": "0", "min": "10", "max": "2956638", "mean": "26738", "stdev": "208422" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }