{ "data_id": "938", "name": "sleuth_ex1221", "exact_name": "sleuth_ex1221", "version": 2, "version_label": null, "description": "**Author**: \n**Source**: Unknown - Date unknown \n**Please cite**: \n\nBinarized version of the original data set (see version 1). It converts the numeric target feature to a two-class nominal target feature by computing the mean and classifying all instances with a lower target value as positive ('P') and all others as negative ('N').", "format": "ARFF", "uploader": "Joaquin Vanschoren", "uploader_id": 2, "visibility": "public", "creator": null, "contributor": null, "date": "2014-10-04 14:37:38", "update_comment": null, "last_update": "2014-10-06 03:37:23", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/53472\/sleuth_ex1221.arff", "default_target_attribute": "binaryClass", "row_id_attribute": null, "ignore_attribute": "\"river\"", "runs": 112, "suggest": { "input": [ "sleuth_ex1221", "Binarized version of the original data set (see version 1). It converts the numeric target feature to a two-class nominal target feature by computing the mean and classifying all instances with a lower target value as positive ('P') and all others as negative ('N'). " ], "weight": 5 }, "qualities": { "NumberOfInstances": 42, "NumberOfFeatures": 10, "NumberOfClasses": 2, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 8, "NumberOfSymbolicFeatures": 2, "REPTreeDepth3Kappa": 0, "DecisionStumpKappa": 0.18678815489749423, "MaxMeansOfNumericAtts": 937888.2380952382, "MinMutualInformation": 0.74667276274686, "Quartile2SkewnessOfNumericAtts": 1.6115238490027792, "RandomTreeDepth1AUC": 0.6510297482837528, "Dimensionality": 0.23809523809523808, "MaxMutualInformation": 0.74667276274686, "MinNominalAttDistinctValues": 2, "PercentageOfBinaryFeatures": 10, "Quartile2StdDevOfNumericAtts": 260.9076749914014, "RandomTreeDepth1ErrRate": 0.3333333333333333, "EquivalentNumberOfAtts": 1.3304988315436987, "MaxNominalAttDistinctValues": 26, "MinSkewnessOfNumericAtts": 0.7473793648795396, "PercentageOfInstancesWithMissingValues": 0, "Quartile3AttributeEntropy": 4.422577995321605, "RandomTreeDepth1Kappa": 0.2811735941320293, "J48.00001.AUC": 0.7414187643020596, "MaxSkewnessOfNumericAtts": 5.449145336057323, "MinStdDevOfNumericAtts": 9.707878429423422, "PercentageOfMissingValues": 0, "Quartile3KurtosisOfNumericAtts": 12.740544572089224, "AutoCorrelation": 0.5121951219512195, "RandomTreeDepth2AUC": 0.6510297482837528, "J48.00001.ErrRate": 0.3333333333333333, "MaxStdDevOfNumericAtts": 1360007.5879489325, "MinorityClassPercentage": 45.23809523809524, "PercentageOfNumericFeatures": 80, "Quartile3MeansOfNumericAtts": 7939.649226190474, "CfsSubsetEval_DecisionStumpAUC": 0.6086956521739131, "RandomTreeDepth2ErrRate": 0.3333333333333333, "J48.00001.Kappa": 0.308235294117647, "MeanAttributeEntropy": 4.422577995321605, "MinorityClassSize": 19, "PercentageOfSymbolicFeatures": 20, "Quartile3MutualInformation": 0.74667276274686, "CfsSubsetEval_DecisionStumpErrRate": 0.42857142857142855, "RandomTreeDepth2Kappa": 0.2811735941320293, "J48.0001.AUC": 0.7414187643020596, "MeanKurtosisOfNumericAtts": 7.662814515206366, "NaiveBayesAUC": 0.791762013729977, "Quartile1AttributeEntropy": 4.422577995321605, "Quartile3SkewnessOfNumericAtts": 3.220717920546113, "CfsSubsetEval_DecisionStumpKappa": 0.12702078521939938, "RandomTreeDepth3AUC": 0.6510297482837528, "J48.0001.ErrRate": 0.3333333333333333, "MeanMeansOfNumericAtts": 118707.02407738096, "NaiveBayesErrRate": 0.2857142857142857, "Quartile1KurtosisOfNumericAtts": 0.05410938731880144, "Quartile3StdDevOfNumericAtts": 20965.822838789594, "CfsSubsetEval_NaiveBayesAUC": 0.6086956521739131, "RandomTreeDepth3ErrRate": 0.3333333333333333, "J48.0001.Kappa": 0.308235294117647, "MeanMutualInformation": 0.74667276274686, "NaiveBayesKappa": 0.4285714285714286, "Quartile1MeansOfNumericAtts": 31.17202380952381, "REPTreeDepth1AUC": 0.47597254004576667, "CfsSubsetEval_NaiveBayesErrRate": 0.42857142857142855, "RandomTreeDepth3Kappa": 0.2811735941320293, "J48.001.AUC": 0.7414187643020596, "MeanNoiseToSignalRatio": 4.923047171363026, "NumberOfBinaryFeatures": 1, "Quartile1MutualInformation": 0.74667276274686, "REPTreeDepth1ErrRate": 0.4523809523809524, "CfsSubsetEval_NaiveBayesKappa": 0.12702078521939938, "CfsSubsetEval_kNN1NAUC": 0.6086956521739131, "StdvNominalAttDistinctValues": 16.97056274847714, "J48.001.ErrRate": 0.3333333333333333, "MeanNominalAttDistinctValues": 14, "Quartile1SkewnessOfNumericAtts": 0.9112659286262209, "REPTreeDepth1Kappa": 0, "CfsSubsetEval_kNN1NErrRate": 0.42857142857142855, "kNN1NAUC": 0.7814645308924485, "J48.001.Kappa": 0.308235294117647, "MeanSkewnessOfNumericAtts": 2.1890668335541528, "Quartile1StdDevOfNumericAtts": 36.2934070277226, "REPTreeDepth2AUC": 0.47597254004576667, "CfsSubsetEval_kNN1NKappa": 0.12702078521939938, "kNN1NErrRate": 0.21428571428571427, "MajorityClassPercentage": 54.761904761904766, "MeanStdDevOfNumericAtts": 173656.56702451623, "Quartile2AttributeEntropy": 4.422577995321605, "REPTreeDepth2ErrRate": 0.4523809523809524, "ClassEntropy": 0.9934472383802027, "kNN1NKappa": 0.5655172413793103, "MajorityClassSize": 23, "MinAttributeEntropy": 4.422577995321605, "Quartile2KurtosisOfNumericAtts": 2.6232549893906976, "REPTreeDepth2Kappa": 0, "REPTreeDepth3AUC": 0.47597254004576667, "DecisionStumpAUC": 0.6384439359267736, "MaxAttributeEntropy": 4.422577995321605, "MinKurtosisOfNumericAtts": -0.3615993022186048, "Quartile2MeansOfNumericAtts": 298.80357142857144, "REPTreeDepth3ErrRate": 0.4523809523809524, "DecisionStumpErrRate": 0.40476190476190477, "MaxKurtosisOfNumericAtts": 32.44514615679193, "MinMeansOfNumericAtts": 13.238095238095239, "Quartile2MutualInformation": 0.74667276274686 }, "tags": [ { "uploader": "38960", "tag": "Chemistry" }, { "uploader": "38960", "tag": "Life Science" }, { "uploader": "1", "tag": "mythbusting_1" }, { "uploader": "2", "tag": "study_1" }, { "uploader": "939", "tag": "study_15" }, { "uploader": "939", "tag": "study_20" } ], "features": [ { "name": "binaryClass", "index": "10", "type": "nominal", "distinct": "2", "missing": "0", "target": "1", "distr": [ [ "P", "N" ], [ [ "23", "0" ], [ "0", "19" ] ] ] }, { "name": "river", "index": "0", "type": "nominal", "distinct": "42", "missing": "0", "ignore": "1", "distr": [ [ "Adige", "Amazon", "Caragh", "Columbia", "Danube", "Delaware", "Fraser", "Ganges", "Glaama", "Huanghe", "Hudson", "Kazan_and_Back", "Mackenzie", "Magdalena", "Mekong", "Mersey", "Meuse", "Mississippi", "Murray-Darling", "Nelson", "Niger", "Nile", "Orange", "Orinoco", "Parana", "Po", "Rhine", "Rhone", "Shannon", "St._Lawrence", "Stikine", "Susquehanna", "Tees", "Thames", "Tiber", "Uruguay", "Vistula", "Volga", "Yangtze", "Yukon", "Zaire", "Zambezi" ], [ [ "1", "0" ], [ "0", "1" ], [ "0", "1" ], [ "0", "1" ], [ "1", "0" ], [ "0", "1" ], [ "0", "1" ], [ "0", "1" ], [ "1", "0" ], [ "1", "0" ], [ "0", "1" ], [ "1", "0" ], [ "1", "0" ], [ "0", "1" ], [ "0", "1" ], [ "0", "1" ], [ "1", "0" ], [ "0", "1" ], [ "1", "0" ], [ "1", "0" ], [ "0", "1" ], [ "1", "0" ], [ "1", "0" ], [ "0", "1" ], [ "1", "0" ], [ "1", "0" ], [ "1", "0" ], [ "1", "0" ], [ "0", "1" ], [ "0", "1" ], [ "0", "1" ], [ "0", "1" ], [ "1", "0" ], [ "1", "0" ], [ "1", "0" ], [ "1", "0" ], [ "1", "0" ], [ "1", "0" ], [ "0", "1" ], [ "1", "0" ], [ "0", "1" ], [ "1", "0" ] ] ] }, { "name": "country", "index": "1", "type": "nominal", "distinct": "26", "missing": "0", "distr": [ [ "Argentina", "Australia", "Canada", "Canada\/USA", "China", "Columbia", "England", "Europe", "France", "India", "Ireland", "Italy", "NE_Africa", "Norway", "Nthlnds\/Belgium", "Poland", "Rumania", "Russia", "SE_Africa", "SE_Asia", "S_Africa", "S_America", "USA", "Venezuela", "W_Africa", "Zaire" ], [ [ "1", "0" ], [ "1", "0" ], [ "4", "1" ], [ "0", "2" ], [ "1", "1" ], [ "0", "1" ], [ "2", "1" ], [ "1", "0" ], [ "1", "0" ], [ "0", "1" ], [ "0", "2" ], [ "3", "0" ], [ "1", "0" ], [ "1", "0" ], [ "1", "0" ], [ "1", "0" ], [ "1", "0" ], [ "1", "0" ], [ "1", "0" ], [ "0", "1" ], [ "1", "0" ], [ "1", "1" ], [ "0", "5" ], [ "0", "1" ], [ "0", "1" ], [ "0", "1" ] ] ] }, { "name": "discharge", "index": "2", "type": "numeric", "distinct": "39", "missing": "0", "min": "7", "max": "175000", "mean": "10342", "stdev": "27630" }, { "name": "runoff", "index": "3", "type": "numeric", "distinct": "36", "missing": "0", "min": "0", "max": "46", "mean": "13", "stdev": "10" }, { "name": "area", "index": "4", "type": "numeric", "distinct": "41", "missing": "0", "min": "160", "max": "7050000", "mean": "937888", "stdev": "1360008" }, { "name": "density", "index": "5", "type": "numeric", "distinct": "26", "missing": "0", "min": "0", "max": "400", "mean": "85", "stdev": "104" }, { "name": "no3", "index": "6", "type": "numeric", "distinct": "39", "missing": "0", "min": "1", "max": "520", "mean": "62", "stdev": "94" }, { "name": "export", "index": "7", "type": "numeric", "distinct": "42", "missing": "0", "min": "4", "max": "4076", "mean": "732", "stdev": "972" }, { "name": "dep", "index": "8", "type": "numeric", "distinct": "39", "missing": "0", "min": "51", "max": "1648", "mean": "512", "stdev": "418" }, { "name": "nprec", "index": "9", "type": "numeric", "distinct": "33", "missing": "0", "min": "1", "max": "61", "mean": "21", "stdev": "17" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }