{ "data_id": "1011", "name": "ecoli", "exact_name": "ecoli", "version": 2, "version_label": null, "description": "**Author**: \n**Source**: Unknown - Date unknown \n**Please cite**: \n\nBinarized version of the original data set (see version 1). The multi-class target feature is converted to a two-class nominal target feature by re-labeling the majority class as positive ('P') and all others as negative ('N'). Originally converted by Quan Sun.", "format": "ARFF", "uploader": "Joaquin Vanschoren", "uploader_id": 2, "visibility": "public", "creator": null, "contributor": null, "date": "2014-10-04 22:45:09", "update_comment": null, "last_update": "2014-10-04 22:45:09", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/53545\/ecoli.arff", "default_target_attribute": "binaryClass", "row_id_attribute": null, "ignore_attribute": null, "runs": 815, "suggest": { "input": [ "ecoli", "Binarized version of the original data set (see version 1). The multi-class target feature is converted to a two-class nominal target feature by re-labeling the majority class as positive ('P') and all others as negative ('N'). Originally converted by Quan Sun. " ], "weight": 5 }, "qualities": { "NumberOfInstances": 336, "NumberOfFeatures": 8, "NumberOfClasses": 2, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 7, "NumberOfSymbolicFeatures": 1, "REPTreeDepth3Kappa": 0.8613761928679056, "DecisionStumpKappa": 0.6481862710300276, "MaxMeansOfNumericAtts": 0.5014880952380952, "MinMutualInformation": null, "Quartile2SkewnessOfNumericAtts": 0.41422005619784913, "RandomTreeDepth1AUC": 0.9103771875792601, "Dimensionality": 0.023809523809523808, "MaxMutualInformation": null, "MinNominalAttDistinctValues": 2, "PercentageOfBinaryFeatures": 12.5, "Quartile2StdDevOfNumericAtts": 0.14815683501342095, "RandomTreeDepth1ErrRate": 0.08630952380952381, "EquivalentNumberOfAtts": null, "MaxNominalAttDistinctValues": 2, "MinSkewnessOfNumericAtts": -0.16595568511332565, "PercentageOfInstancesWithMissingValues": 0, "Quartile3AttributeEntropy": null, "RandomTreeDepth1Kappa": 0.8229908443540183, "J48.00001.AUC": 0.9400340592050437, "MaxSkewnessOfNumericAtts": 18.33030277982337, "MinStdDevOfNumericAtts": 0.027277236279499045, "PercentageOfMissingValues": 0, "Quartile3KurtosisOfNumericAtts": 29.079409081025663, "AutoCorrelation": 0.9970149253731343, "RandomTreeDepth2AUC": 0.9103771875792601, "J48.00001.ErrRate": 0.0744047619047619, "MaxStdDevOfNumericAtts": 0.21575130297051617, "MinorityClassPercentage": 42.55952380952381, "PercentageOfNumericFeatures": 87.5, "Quartile3MeansOfNumericAtts": 0.5001785714285714, "CfsSubsetEval_DecisionStumpAUC": 0.9400340592050437, "RandomTreeDepth2ErrRate": 0.08630952380952381, "J48.00001.Kappa": 0.8471281939288056, "MeanAttributeEntropy": null, "MinorityClassSize": 143, "PercentageOfSymbolicFeatures": 12.5, "Quartile3MutualInformation": null, "CfsSubsetEval_DecisionStumpErrRate": 0.0744047619047619, "RandomTreeDepth2Kappa": 0.8229908443540183, "J48.0001.AUC": 0.9400340592050437, "MeanKurtosisOfNumericAtts": 51.97603083018976, "NaiveBayesAUC": 0.9882604442189934, "Quartile1AttributeEntropy": null, "Quartile3SkewnessOfNumericAtts": 5.559347967337419, "CfsSubsetEval_DecisionStumpKappa": 0.8471281939288056, "RandomTreeDepth3AUC": 0.9103771875792601, "J48.0001.ErrRate": 0.0744047619047619, "MeanMeansOfNumericAtts": 0.4995663265306122, "NaiveBayesErrRate": 0.044642857142857144, "Quartile1KurtosisOfNumericAtts": -0.9382139689565889, "Quartile3StdDevOfNumericAtts": 0.20941051515928003, "CfsSubsetEval_NaiveBayesAUC": 0.9400340592050437, "RandomTreeDepth3ErrRate": 0.08630952380952381, "J48.0001.Kappa": 0.8471281939288056, "MeanMutualInformation": null, "NaiveBayesKappa": 0.9082769163572834, "Quartile1MeansOfNumericAtts": 0.49973214285714285, "REPTreeDepth1AUC": 0.9436573788905394, "CfsSubsetEval_NaiveBayesErrRate": 0.0744047619047619, "RandomTreeDepth3Kappa": 0.8229908443540183, "J48.001.AUC": 0.9400340592050437, "MeanNoiseToSignalRatio": null, "NumberOfBinaryFeatures": 1, "Quartile1MutualInformation": null, "REPTreeDepth1ErrRate": 0.06845238095238096, "CfsSubsetEval_NaiveBayesKappa": 0.8471281939288056, "CfsSubsetEval_kNN1NAUC": 0.9400340592050437, "StdvNominalAttDistinctValues": 0, "J48.001.ErrRate": 0.0744047619047619, "MeanNominalAttDistinctValues": 2, "Quartile1SkewnessOfNumericAtts": 0.06286669592022871, "REPTreeDepth1Kappa": 0.8613761928679056, "CfsSubsetEval_kNN1NErrRate": 0.0744047619047619, "kNN1NAUC": 0.9513025834269357, "J48.001.Kappa": 0.8471281939288056, "MeanSkewnessOfNumericAtts": 3.6055010492684385, "Quartile1StdDevOfNumericAtts": 0.08849527872597225, "REPTreeDepth2AUC": 0.9436573788905394, "CfsSubsetEval_kNN1NKappa": 0.8471281939288056, "kNN1NErrRate": 0.047619047619047616, "MajorityClassPercentage": 57.44047619047619, "MeanStdDevOfNumericAtts": 0.14372869668428687, "Quartile2AttributeEntropy": null, "REPTreeDepth2ErrRate": 0.06845238095238096, "ClassEntropy": 0.9839667997071854, "kNN1NKappa": 0.9026051668538714, "MajorityClassSize": 193, "MinAttributeEntropy": null, "Quartile2KurtosisOfNumericAtts": 0.2594151075222815, "REPTreeDepth2Kappa": 0.8613761928679056, "REPTreeDepth3AUC": 0.9436573788905394, "DecisionStumpAUC": 0.8745063226928512, "MaxAttributeEntropy": null, "MinKurtosisOfNumericAtts": -1.0447542888959216, "Quartile2MeansOfNumericAtts": 0.5000297619047619, "REPTreeDepth3ErrRate": 0.06845238095238096, "DecisionStumpErrRate": 0.17559523809523808, "MaxKurtosisOfNumericAtts": 335.99999999999915, "MinMeansOfNumericAtts": 0.4954761904761904, "Quartile2MutualInformation": null }, "tags": [ { "uploader": "38960", "tag": "Chemistry" }, { "uploader": "38960", "tag": "Life Science" }, { "uploader": "1", "tag": "mythbusting_1" }, { "uploader": "2", "tag": "study_1" }, { "uploader": "939", "tag": "study_15" }, { "uploader": "939", "tag": "study_20" }, { "uploader": "1", "tag": "study_41" }, { "uploader": "64", "tag": "study_7" }, { "uploader": "4209", "tag": "study_88" } ], "features": [ { "name": "binaryClass", "index": "7", "type": "nominal", "distinct": "2", "missing": "0", "target": "1", "distr": [ [ "P", "N" ], [ [ "143", "0" ], [ "0", "193" ] ] ] }, { "name": "mcg", "index": "0", "type": "numeric", "distinct": "78", "missing": "0", "min": "0", "max": "1", "mean": "1", "stdev": "0" }, { "name": "gvh", "index": "1", "type": "numeric", "distinct": "63", "missing": "0", "min": "0", "max": "1", "mean": "1", "stdev": "0" }, { "name": "lip", "index": "2", "type": "numeric", "distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "chg", "index": "3", "type": "numeric", "distinct": "2", "missing": "0", "min": "1", "max": "1", "mean": "1", "stdev": "0" }, { "name": "aac", "index": "4", "type": "numeric", "distinct": "59", "missing": "0", "min": "0", "max": "1", "mean": "1", "stdev": "0" }, { "name": "alm1", "index": "5", "type": "numeric", "distinct": "82", "missing": "0", "min": "0", "max": "1", "mean": "1", "stdev": "0" }, { "name": "alm2", "index": "6", "type": "numeric", "distinct": "77", "missing": "0", "min": "0", "max": "1", "mean": "0", "stdev": "0" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }