{ "data_id": "760", "name": "analcatdata_uktrainacc", "exact_name": "analcatdata_uktrainacc", "version": 2, "version_label": null, "description": "**Author**: \n**Source**: Unknown - Date unknown \n**Please cite**: \n\nBinarized version of the original data set (see version 1). It converts the numeric target feature to a two-class nominal target feature by computing the mean and classifying all instances with a lower target value as positive ('P') and all others as negative ('N').", "format": "ARFF", "uploader": "Joaquin Vanschoren", "uploader_id": 2, "visibility": "public", "creator": null, "contributor": null, "date": "2014-10-04 14:32:44", "update_comment": "Year is a row id", "last_update": "2015-04-15 17:15:07", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/53294\/analcatdata_uktrainacc.arff", "default_target_attribute": "binaryClass", "row_id_attribute": "Year", "ignore_attribute": null, "runs": 100, "suggest": { "input": [ "analcatdata_uktrainacc", "Binarized version of the original data set (see version 1). It converts the numeric target feature to a two-class nominal target feature by computing the mean and classifying all instances with a lower target value as positive ('P') and all others as negative ('N'). " ], "weight": 5 }, "qualities": { "NumberOfInstances": 31, "NumberOfFeatures": 16, "NumberOfClasses": 2, "NumberOfMissingValues": 150, "NumberOfInstancesWithMissingValues": 25, "NumberOfNumericFeatures": 15, "NumberOfSymbolicFeatures": 1, "REPTreeDepth3Kappa": 0, "DecisionStumpKappa": 0.7129629629629627, "MaxMeansOfNumericAtts": 66.25806451612904, "MinMutualInformation": null, "Quartile2SkewnessOfNumericAtts": 1.34674034641558, "RandomTreeDepth1AUC": 0.6944444444444444, "Dimensionality": 0.5161290322580645, "MaxMutualInformation": null, "MinNominalAttDistinctValues": 2, "PercentageOfBinaryFeatures": 6.25, "Quartile2StdDevOfNumericAtts": 1.8216145503076304, "RandomTreeDepth1ErrRate": 0.16129032258064516, "EquivalentNumberOfAtts": null, "MaxNominalAttDistinctValues": 2, "MinSkewnessOfNumericAtts": -1.0381948517135466, "PercentageOfInstancesWithMissingValues": 80.64516129032258, "Quartile3AttributeEntropy": null, "RandomTreeDepth1Kappa": 0.3514644351464437, "J48.00001.AUC": 0.9444444444444444, "MaxSkewnessOfNumericAtts": 3.536425261573178, "MinStdDevOfNumericAtts": 0.01884241383527559, "PercentageOfMissingValues": 30.241935483870968, "Quartile3KurtosisOfNumericAtts": 3.5350676378772175, "AutoCorrelation": 0.7666666666666667, "RandomTreeDepth2AUC": 0.6944444444444444, "J48.00001.ErrRate": 0.06451612903225806, "MaxStdDevOfNumericAtts": 24.50078603084057, "MinorityClassPercentage": 12.903225806451612, "PercentageOfNumericFeatures": 93.75, "Quartile3MeansOfNumericAtts": 8.806451612903228, "CfsSubsetEval_DecisionStumpAUC": 0.8240740740740741, "RandomTreeDepth2ErrRate": 0.16129032258064516, "J48.00001.Kappa": 0.763358778625954, "MeanAttributeEntropy": null, "MinorityClassSize": 4, "PercentageOfSymbolicFeatures": 6.25, "Quartile3MutualInformation": null, "CfsSubsetEval_DecisionStumpErrRate": 0.12903225806451613, "RandomTreeDepth2Kappa": 0.3514644351464437, "J48.0001.AUC": 0.9444444444444444, "MeanKurtosisOfNumericAtts": 2.8879049188842894, "NaiveBayesAUC": 0.5918458781362007, "Quartile1AttributeEntropy": null, "Quartile3SkewnessOfNumericAtts": 1.8259167737442272, "CfsSubsetEval_DecisionStumpKappa": 0.4259259259259259, "RandomTreeDepth3AUC": 0.6944444444444444, "J48.0001.ErrRate": 0.06451612903225806, "MeanMeansOfNumericAtts": 8.403979211469535, "NaiveBayesErrRate": 0.25806451612903225, "Quartile1KurtosisOfNumericAtts": 0.8694263947038703, "Quartile3StdDevOfNumericAtts": 5.612486080160912, "CfsSubsetEval_NaiveBayesAUC": 0.8240740740740741, "RandomTreeDepth3ErrRate": 0.16129032258064516, "J48.0001.Kappa": 0.763358778625954, "MeanMutualInformation": null, "NaiveBayesKappa": 0.0534351145038167, "Quartile1MeansOfNumericAtts": 0.8387096774193548, "REPTreeDepth1AUC": 0.49074074074074076, "CfsSubsetEval_NaiveBayesErrRate": 0.12903225806451613, "RandomTreeDepth3Kappa": 0.3514644351464437, "J48.001.AUC": 0.9444444444444444, "MeanNoiseToSignalRatio": null, "NumberOfBinaryFeatures": 1, "Quartile1MutualInformation": null, "REPTreeDepth1ErrRate": 0.12903225806451613, "CfsSubsetEval_NaiveBayesKappa": 0.4259259259259259, "CfsSubsetEval_kNN1NAUC": 0.8240740740740741, "StdvNominalAttDistinctValues": 0, "J48.001.ErrRate": 0.06451612903225806, "MeanNominalAttDistinctValues": 2, "Quartile1SkewnessOfNumericAtts": 0.8573214099741132, "REPTreeDepth1Kappa": 0, "CfsSubsetEval_kNN1NErrRate": 0.12903225806451613, "kNN1NAUC": 0.49074074074074076, "J48.001.Kappa": 0.763358778625954, "MeanSkewnessOfNumericAtts": 1.2864441742247166, "Quartile1StdDevOfNumericAtts": 0.816496580927726, "REPTreeDepth2AUC": 0.49074074074074076, "CfsSubsetEval_kNN1NKappa": 0.4259259259259259, "kNN1NErrRate": 0.12903225806451613, "MajorityClassPercentage": 87.09677419354838, "MeanStdDevOfNumericAtts": 4.65829529713265, "Quartile2AttributeEntropy": null, "REPTreeDepth2ErrRate": 0.12903225806451613, "ClassEntropy": 0.5547781633412736, "kNN1NKappa": 0, "MajorityClassSize": 27, "MinAttributeEntropy": null, "Quartile2KurtosisOfNumericAtts": 2.0205647709853185, "REPTreeDepth2Kappa": 0, "REPTreeDepth3AUC": 0.49074074074074076, "DecisionStumpAUC": 0.8472222222222222, "MaxAttributeEntropy": null, "MinKurtosisOfNumericAtts": -1.1284289391619282, "Quartile2MeansOfNumericAtts": 2.21, "REPTreeDepth3ErrRate": 0.12903225806451613, "DecisionStumpErrRate": 0.06451612903225806, "MaxKurtosisOfNumericAtts": 14.489616093755057, "MinMeansOfNumericAtts": 0.25806451612903236, "Quartile2MutualInformation": null }, "tags": [ { "uploader": "38960", "tag": "Chemistry" }, { "uploader": "38960", "tag": "Life Science" }, { "uploader": "1", "tag": "mythbusting_1" }, { "uploader": "2", "tag": "study_1" }, { "uploader": "939", "tag": "study_15" }, { "uploader": "939", "tag": "study_20" } ], "features": [ { "name": "binaryClass", "index": "16", "type": "nominal", "distinct": "2", "missing": "0", "target": "1", "distr": [ [ "P", "N" ], [ [ "27", "0" ], [ "0", "4" ] ] ] }, { "name": "Year", "index": "0", "type": "numeric", "distinct": "31", "missing": "0", "identifier": "1", "min": "1", "max": "31", "mean": "16", "stdev": "9" }, { "name": "Train_km", "index": "1", "type": "numeric", "distinct": "22", "missing": "0", "min": "0", "max": "0", "mean": "0", "stdev": "0" }, { "name": "Pct_Mark_I", "index": "2", "type": "numeric", "distinct": "31", "missing": "0", "min": "20", "max": "97", "mean": "66", "stdev": "25" }, { "name": "Accidents", "index": "3", "type": "numeric", "distinct": "8", "missing": "0", "min": "0", "max": "7", "mean": "2", "stdev": "2" }, { "name": "SPAD_preventable", "index": "4", "type": "numeric", "distinct": "4", "missing": "0", "min": "0", "max": "5", "mean": "1", "stdev": "1" }, { "name": "Other_preventable", "index": "5", "type": "numeric", "distinct": "3", "missing": "0", "min": "0", "max": "2", "mean": "0", "stdev": "1" }, { "name": "Non_preventable", "index": "6", "type": "numeric", "distinct": "5", "missing": "0", "min": "0", "max": "4", "mean": "1", "stdev": "1" }, { "name": "Year_grouped", "index": "7", "type": "numeric", "distinct": "6", "missing": "25", "min": "3", "max": "29", "mean": "16", "stdev": "9" }, { "name": "Accidents_grouped", "index": "8", "type": "numeric", "distinct": "5", "missing": "25", "min": "7", "max": "23", "mean": "13", "stdev": "6" }, { "name": "SPAD_grouped", "index": "9", "type": "numeric", "distinct": "3", "missing": "25", "min": "3", "max": "5", "mean": "4", "stdev": "1" }, { "name": "Other_grouped", "index": "10", "type": "numeric", "distinct": "4", "missing": "25", "min": "0", "max": "4", "mean": "1", "stdev": "2" }, { "name": "Non_grouped", "index": "11", "type": "numeric", "distinct": "6", "missing": "25", "min": "4", "max": "15", "mean": "8", "stdev": "4" }, { "name": "Train_km_grouped", "index": "12", "type": "numeric", "distinct": "6", "missing": "25", "min": "2", "max": "3", "mean": "2", "stdev": "0" }, { "name": "Fatalities", "index": "13", "type": "numeric", "distinct": "17", "missing": "0", "min": "0", "max": "73", "mean": "9", "stdev": "14" }, { "name": "SPAD_fatalities", "index": "14", "type": "numeric", "distinct": "9", "missing": "0", "min": "0", "max": "12", "mean": "2", "stdev": "3" }, { "name": "Other_fatalities", "index": "15", "type": "numeric", "distinct": "5", "missing": "0", "min": "0", "max": "8", "mean": "1", "stdev": "2" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }