{ "data_id": "810", "name": "pbc", "exact_name": "pbc", "version": 3, "version_label": null, "description": "**Author**: \n**Source**: Unknown - Date unknown \n**Please cite**: \n\nBinarized version of the original data set (see version 1). It converts the numeric target feature to a two-class nominal target feature by computing the mean and classifying all instances with a lower target value as positive ('P') and all others as negative ('N').", "format": "ARFF", "uploader": "Joaquin Vanschoren", "uploader_id": 2, "visibility": "public", "creator": null, "contributor": null, "date": "2014-10-04 14:34:05", "update_comment": null, "last_update": "2014-10-04 14:34:05", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/53344\/pbc.arff", "default_target_attribute": "binaryClass", "row_id_attribute": null, "ignore_attribute": null, "runs": 723, "suggest": { "input": [ "pbc", "Binarized version of the original data set (see version 1). It converts the numeric target feature to a two-class nominal target feature by computing the mean and classifying all instances with a lower target value as positive ('P') and all others as negative ('N'). " ], "weight": 5 }, "qualities": { "NumberOfInstances": 418, "NumberOfFeatures": 19, "NumberOfClasses": 2, "NumberOfMissingValues": 1239, "NumberOfInstancesWithMissingValues": 142, "NumberOfNumericFeatures": 10, "NumberOfSymbolicFeatures": 9, "REPTreeDepth3Kappa": 0.3470090537982622, "DecisionStumpKappa": 0.21869158878504663, "MaxMeansOfNumericAtts": 1982.6557692307697, "MinMutualInformation": 0.00100008382517, "Quartile2SkewnessOfNumericAtts": 2.263458074946497, "RandomTreeDepth1AUC": 0.6259935643498621, "Dimensionality": 0.045454545454545456, "MaxMutualInformation": 0.06477883637486, "MinNominalAttDistinctValues": 2, "PercentageOfBinaryFeatures": 36.84210526315789, "Quartile2StdDevOfNumericAtts": 60.92408176457625, "RandomTreeDepth1ErrRate": 0.3803827751196172, "EquivalentNumberOfAtts": 27.940957023638127, "MaxNominalAttDistinctValues": 4, "MinSkewnessOfNumericAtts": -0.46752651417628355, "PercentageOfInstancesWithMissingValues": 33.97129186602871, "Quartile3AttributeEntropy": 0.9883080065735903, "RandomTreeDepth1Kappa": 0.2227939284795471, "J48.00001.AUC": 0.6807677965201457, "MaxSkewnessOfNumericAtts": 3.408525855721415, "MinStdDevOfNumericAtts": 0.4249716057796193, "PercentageOfMissingValues": 15.600604381767816, "Quartile3KurtosisOfNumericAtts": 10.481267833436679, "AutoCorrelation": 0.6306954436450839, "RandomTreeDepth2AUC": 0.6259935643498621, "J48.00001.ErrRate": 0.3444976076555024, "MaxStdDevOfNumericAtts": 2140.3888244517593, "MinorityClassPercentage": 44.97607655502392, "PercentageOfNumericFeatures": 52.63157894736842, "Quartile3MeansOfNumericAtts": 285.14606836349793, "CfsSubsetEval_DecisionStumpAUC": 0.6940911193339502, "RandomTreeDepth2ErrRate": 0.3803827751196172, "J48.00001.Kappa": 0.3026230419872092, "MeanAttributeEntropy": 0.9425249756295572, "MinorityClassSize": 188, "PercentageOfSymbolicFeatures": 47.368421052631575, "Quartile3MutualInformation": 0.0576810521048775, "CfsSubsetEval_DecisionStumpErrRate": 0.33253588516746413, "RandomTreeDepth2Kappa": 0.2227939284795471, "J48.0001.AUC": 0.6807677965201457, "MeanKurtosisOfNumericAtts": 6.665834850291861, "NaiveBayesAUC": 0.7572217931297001, "Quartile1AttributeEntropy": 0.7896534086056475, "Quartile3SkewnessOfNumericAtts": 2.7864166103927372, "CfsSubsetEval_DecisionStumpKappa": 0.3310691012917636, "RandomTreeDepth3AUC": 0.6259935643498621, "J48.0001.ErrRate": 0.3444976076555024, "MeanMeansOfNumericAtts": 302.2289207472942, "NaiveBayesErrRate": 0.33014354066985646, "Quartile1KurtosisOfNumericAtts": 0.7889695506942599, "Quartile3StdDevOfNumericAtts": 131.7303246719448, "CfsSubsetEval_NaiveBayesAUC": 0.6940911193339502, "RandomTreeDepth3ErrRate": 0.3803827751196172, "J48.0001.Kappa": 0.3026230419872092, "MeanMutualInformation": 0.03552866948610125, "NaiveBayesKappa": 0.35369515529063783, "Quartile1MeansOfNumericAtts": 8.923158124769966, "REPTreeDepth1AUC": 0.6962997224791858, "CfsSubsetEval_NaiveBayesErrRate": 0.33253588516746413, "RandomTreeDepth3Kappa": 0.2227939284795471, "J48.001.AUC": 0.6807677965201457, "MeanNoiseToSignalRatio": 25.528575070852884, "NumberOfBinaryFeatures": 7, "Quartile1MutualInformation": 0.0075575106310475, "REPTreeDepth1ErrRate": 0.3277511961722488, "CfsSubsetEval_NaiveBayesKappa": 0.3310691012917636, "CfsSubsetEval_kNN1NAUC": 0.6940911193339502, "StdvNominalAttDistinctValues": 0.7071067811865475, "J48.001.ErrRate": 0.3444976076555024, "MeanNominalAttDistinctValues": 2.3333333333333335, "Quartile1SkewnessOfNumericAtts": 0.4920376088747952, "REPTreeDepth1Kappa": 0.3470090537982622, "CfsSubsetEval_kNN1NErrRate": 0.33253588516746413, "kNN1NAUC": 0.5830712303422757, "J48.001.Kappa": 0.3026230419872092, "MeanSkewnessOfNumericAtts": 1.7865414820330217, "Quartile1StdDevOfNumericAtts": 3.5611298747086373, "REPTreeDepth2AUC": 0.6962997224791858, "CfsSubsetEval_kNN1NKappa": 0.3310691012917636, "kNN1NErrRate": 0.4043062200956938, "MajorityClassPercentage": 55.02392344497608, "MeanStdDevOfNumericAtts": 269.4422690047972, "Quartile2AttributeEntropy": 0.9475561599942943, "REPTreeDepth2ErrRate": 0.3277511961722488, "ClassEntropy": 0.9927050272181983, "kNN1NKappa": 0.16901540995177053, "MajorityClassSize": 230, "MinAttributeEntropy": 0.4233995331297363, "Quartile2KurtosisOfNumericAtts": 7.844679564303095, "REPTreeDepth2Kappa": 0.3470090537982622, "REPTreeDepth3AUC": 0.6962997224791858, "DecisionStumpAUC": 0.633418131359852, "MaxAttributeEntropy": 1.6137794433358423, "MinKurtosisOfNumericAtts": -0.616724760817668, "Quartile2MeansOfNumericAtts": 110.10236662531017, "REPTreeDepth3ErrRate": 0.3277511961722488, "DecisionStumpErrRate": 0.3923444976076555, "MaxKurtosisOfNumericAtts": 14.337869865983695, "MinMeansOfNumericAtts": 3.2208133971291866, "Quartile2MutualInformation": 0.03820824647617 }, "tags": [ { "uploader": "1", "tag": "binarized" }, { "uploader": "38960", "tag": "Chemistry" }, { "uploader": "38960", "tag": "Life Science" }, { "uploader": "1", "tag": "mythbusting_1" }, { "uploader": "2", "tag": "study_1" }, { "uploader": "3886", "tag": "study_123" }, { "uploader": "939", "tag": "study_15" }, { "uploader": "939", "tag": "study_20" }, { "uploader": "1", "tag": "study_41" } ], "features": [ { "name": "binaryClass", "index": "18", "type": "nominal", "distinct": "2", "missing": "0", "target": "1", "distr": [ [ "P", "N" ], [ [ "230", "0" ], [ "0", "188" ] ] ] }, { "name": "D", "index": "0", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "1", "0" ], [ [ "117", "44" ], [ "113", "144" ] ] ] }, { "name": "Z1", "index": "1", "type": "nominal", "distinct": "2", "missing": "106", "distr": [ [ "1", "2" ], [ [ "80", "78" ], [ "81", "73" ] ] ] }, { "name": "Z2", "index": "2", "type": "numeric", "distinct": "345", "missing": "0", "min": "26", "max": "78", "mean": "51", "stdev": "10" }, { "name": "Z3", "index": "3", "type": "nominal", "distinct": "2", "missing": "106", "distr": [ [ "1", "0" ], [ [ "139", "137" ], [ "22", "14" ] ] ] }, { "name": "Z4", "index": "4", "type": "nominal", "distinct": "2", "missing": "106", "distr": [ [ "1", "0" ], [ [ "21", "3" ], [ "140", "148" ] ] ] }, { "name": "Z5", "index": "5", "type": "nominal", "distinct": "2", "missing": "106", "distr": [ [ "1", "0" ], [ [ "105", "55" ], [ "56", "96" ] ] ] }, { "name": "Z6", "index": "6", "type": "nominal", "distinct": "2", "missing": "106", "distr": [ [ "1", "0" ], [ [ "62", "28" ], [ "99", "123" ] ] ] }, { "name": "Z7", "index": "7", "type": "nominal", "distinct": "3", "missing": "0", "distr": [ [ "1", "0", "0.500000" ], [ [ "19", "1" ], [ "180", "174" ], [ "31", "13" ] ] ] }, { "name": "Z8", "index": "8", "type": "numeric", "distinct": "98", "missing": "0", "min": "0", "max": "28", "mean": "3", "stdev": "4" }, { "name": "Z9", "index": "9", "type": "numeric", "distinct": "201", "missing": "134", "min": "120", "max": "1775", "mean": "370", "stdev": "232" }, { "name": "Z10", "index": "10", "type": "numeric", "distinct": "154", "missing": "0", "min": "2", "max": "5", "mean": "3", "stdev": "0" }, { "name": "Z11", "index": "11", "type": "numeric", "distinct": "158", "missing": "108", "min": "4", "max": "588", "mean": "98", "stdev": "86" }, { "name": "Z12", "index": "12", "type": "numeric", "distinct": "295", "missing": "106", "min": "289", "max": "13862", "mean": "1983", "stdev": "2140" }, { "name": "Z13", "index": "13", "type": "numeric", "distinct": "179", "missing": "106", "min": "26", "max": "457", "mean": "123", "stdev": "57" }, { "name": "Z14", "index": "14", "type": "numeric", "distinct": "146", "missing": "136", "min": "33", "max": "598", "mean": "125", "stdev": "65" }, { "name": "Z15", "index": "15", "type": "numeric", "distinct": "243", "missing": "11", "min": "62", "max": "721", "mean": "257", "stdev": "98" }, { "name": "Z16", "index": "16", "type": "numeric", "distinct": "48", "missing": "2", "min": "9", "max": "18", "mean": "11", "stdev": "1" }, { "name": "Z17", "index": "17", "type": "nominal", "distinct": "4", "missing": "106", "distr": [ [ "4", "3", "2", "1" ], [ [ "77", "32" ], [ "58", "62" ], [ "23", "44" ], [ "3", "13" ] ] ] } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }