{ "data_id": "1014", "name": "analcatdata_dmft", "exact_name": "analcatdata_dmft", "version": 2, "version_label": null, "description": "**Author**: \n**Source**: Unknown - Date unknown \n**Please cite**: \n\nBinarized version of the original data set (see version 1). The multi-class target feature is converted to a two-class nominal target feature by re-labeling the majority class as positive ('P') and all others as negative ('N'). Originally converted by Quan Sun.", "format": "ARFF", "uploader": "Joaquin Vanschoren", "uploader_id": 2, "visibility": "public", "creator": null, "contributor": null, "date": "2014-10-04 22:45:13", "update_comment": null, "last_update": "2014-10-04 22:45:13", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/53548\/analcatdata_dmft.arff", "default_target_attribute": "binaryClass", "row_id_attribute": null, "ignore_attribute": null, "runs": 774, "suggest": { "input": [ "analcatdata_dmft", "Binarized version of the original data set (see version 1). The multi-class target feature is converted to a two-class nominal target feature by re-labeling the majority class as positive ('P') and all others as negative ('N'). Originally converted by Quan Sun. " ], "weight": 5 }, "qualities": { "NumberOfInstances": 797, "NumberOfFeatures": 5, "NumberOfClasses": 2, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 0, "NumberOfSymbolicFeatures": 5, "REPTreeDepth3Kappa": -0.009881816660423856, "DecisionStumpKappa": 0, "MaxMeansOfNumericAtts": null, "MinMutualInformation": 0.00016267085188, "Quartile2SkewnessOfNumericAtts": null, "RandomTreeDepth1AUC": 0.4487438448397146, "Dimensionality": 0.006273525721455458, "MaxMutualInformation": 0.0102955772291, "MinNominalAttDistinctValues": 2, "PercentageOfBinaryFeatures": 40, "Quartile2StdDevOfNumericAtts": null, "RandomTreeDepth1ErrRate": 0.32622333751568383, "EquivalentNumberOfAtts": 125.92009437826562, "MaxNominalAttDistinctValues": 9, "MinSkewnessOfNumericAtts": null, "PercentageOfInstancesWithMissingValues": 0, "Quartile3AttributeEntropy": 2.9494788749394134, "RandomTreeDepth1Kappa": -0.07270054251045664, "J48.00001.AUC": 0.49838709677419357, "MaxSkewnessOfNumericAtts": null, "MinStdDevOfNumericAtts": null, "PercentageOfMissingValues": 0, "Quartile3KurtosisOfNumericAtts": null, "AutoCorrelation": 0.9974874371859297, "RandomTreeDepth2AUC": 0.4487438448397146, "J48.00001.ErrRate": 0.1944792973651192, "MaxStdDevOfNumericAtts": null, "MinorityClassPercentage": 19.44792973651192, "PercentageOfNumericFeatures": 0, "Quartile3MeansOfNumericAtts": null, "CfsSubsetEval_DecisionStumpAUC": 0.49838709677419357, "RandomTreeDepth2ErrRate": 0.32622333751568383, "J48.00001.Kappa": 0, "MeanAttributeEntropy": 2.016975283182629, "MinorityClassSize": 155, "PercentageOfSymbolicFeatures": 100, "Quartile3MutualInformation": 0.009974316830384999, "CfsSubsetEval_DecisionStumpErrRate": 0.1944792973651192, "RandomTreeDepth2Kappa": -0.07270054251045664, "J48.0001.AUC": 0.49838709677419357, "MeanKurtosisOfNumericAtts": null, "NaiveBayesAUC": 0.5193647492537776, "Quartile1AttributeEntropy": 1.108792761984236, "Quartile3SkewnessOfNumericAtts": null, "CfsSubsetEval_DecisionStumpKappa": 0, "RandomTreeDepth3AUC": 0.4487438448397146, "J48.0001.ErrRate": 0.1944792973651192, "MeanMeansOfNumericAtts": null, "NaiveBayesErrRate": 0.1944792973651192, "Quartile1KurtosisOfNumericAtts": null, "Quartile3StdDevOfNumericAtts": null, "CfsSubsetEval_NaiveBayesAUC": 0.49838709677419357, "RandomTreeDepth3ErrRate": 0.32622333751568383, "J48.0001.Kappa": 0, "MeanMutualInformation": 0.005644439214245, "NaiveBayesKappa": 0, "Quartile1MeansOfNumericAtts": null, "REPTreeDepth1AUC": 0.507768063511205, "CfsSubsetEval_NaiveBayesErrRate": 0.1944792973651192, "RandomTreeDepth3Kappa": -0.07270054251045664, "J48.001.AUC": 0.49838709677419357, "MeanNoiseToSignalRatio": 356.3384718347825, "NumberOfBinaryFeatures": 2, "Quartile1MutualInformation": 0.00089924642435, "REPTreeDepth1ErrRate": 0.19949811794228356, "CfsSubsetEval_NaiveBayesKappa": 0, "CfsSubsetEval_kNN1NAUC": 0.49838709677419357, "StdvNominalAttDistinctValues": 3.209361307176242, "J48.001.ErrRate": 0.1944792973651192, "MeanNominalAttDistinctValues": 4.6, "Quartile1SkewnessOfNumericAtts": null, "REPTreeDepth1Kappa": -0.009881816660423856, "CfsSubsetEval_kNN1NErrRate": 0.1944792973651192, "kNN1NAUC": 0.4632298261481258, "J48.001.Kappa": 0, "MeanSkewnessOfNumericAtts": null, "Quartile1StdDevOfNumericAtts": null, "REPTreeDepth2AUC": 0.507768063511205, "CfsSubsetEval_kNN1NKappa": 0, "kNN1NErrRate": 0.29109159347553326, "MajorityClassPercentage": 80.55207026348809, "MeanStdDevOfNumericAtts": null, "Quartile2AttributeEntropy": 1.9926542126242377, "REPTreeDepth2ErrRate": 0.19949811794228356, "ClassEntropy": 0.7107483185701138, "kNN1NKappa": -0.046914810494966375, "MajorityClassSize": 642, "MinAttributeEntropy": 0.9995900071849526, "Quartile2KurtosisOfNumericAtts": null, "REPTreeDepth2Kappa": -0.009881816660423856, "REPTreeDepth3AUC": 0.507768063511205, "DecisionStumpAUC": 0.5250326600341674, "MaxAttributeEntropy": 3.083002700297088, "MinKurtosisOfNumericAtts": null, "Quartile2MeansOfNumericAtts": null, "REPTreeDepth3ErrRate": 0.19949811794228356, "DecisionStumpErrRate": 0.1944792973651192, "MaxKurtosisOfNumericAtts": null, "MinMeansOfNumericAtts": null, "Quartile2MutualInformation": 0.006059754387999999 }, "tags": [ { "uploader": "38960", "tag": "Chemistry" }, { "uploader": "38960", "tag": "Life Science" }, { "uploader": "1", "tag": "mythbusting_1" }, { "uploader": "2", "tag": "study_1" }, { "uploader": "5824", "tag": "study_144" }, { "uploader": "939", "tag": "study_15" }, { "uploader": "939", "tag": "study_20" }, { "uploader": "1", "tag": "study_41" }, { "uploader": "64", "tag": "study_7" } ], "features": [ { "name": "binaryClass", "index": "4", "type": "nominal", "distinct": "2", "missing": "0", "target": "1", "distr": [ [ "P", "N" ], [ [ "155", "0" ], [ "0", "642" ] ] ] }, { "name": "DMFT.Begin", "index": "0", "type": "nominal", "distinct": "9", "missing": "0", "distr": [ [ "0", "1", "2", "3", "4", "5", "6", "7", "8" ], [ [ "39", "133" ], [ "17", "56" ], [ "11", "85" ], [ "11", "69" ], [ "15", "80" ], [ "22", "61" ], [ "17", "68" ], [ "13", "52" ], [ "10", "38" ] ] ] }, { "name": "DMFT.End", "index": "1", "type": "nominal", "distinct": "7", "missing": "0", "distr": [ [ "0", "1", "2", "3", "4", "5", "6" ], [ [ "57", "174" ], [ "27", "136" ], [ "24", "116" ], [ "20", "96" ], [ "15", "55" ], [ "11", "44" ], [ "1", "21" ] ] ] }, { "name": "Gender", "index": "2", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "Female", "Male" ], [ [ "86", "303" ], [ "69", "339" ] ] ] }, { "name": "Ethnic", "index": "3", "type": "nominal", "distinct": "3", "missing": "0", "distr": [ [ "Black", "Dark", "White" ], [ [ "21", "91" ], [ "61", "241" ], [ "73", "310" ] ] ] } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }