{ "data_id": "923", "name": "visualizing_soil", "exact_name": "visualizing_soil", "version": 2, "version_label": null, "description": "**Author**: \n**Source**: Unknown - Date unknown \n**Please cite**: \n\nBinarized version of the original data set (see version 1). It converts the numeric target feature to a two-class nominal target feature by computing the mean and classifying all instances with a lower target value as positive ('P') and all others as negative ('N').", "format": "ARFF", "uploader": "Joaquin Vanschoren", "uploader_id": 2, "visibility": "public", "creator": null, "contributor": null, "date": "2014-10-04 14:37:15", "update_comment": null, "last_update": "2014-10-04 14:37:15", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/53457\/visualizing_soil.arff", "default_target_attribute": "binaryClass", "row_id_attribute": null, "ignore_attribute": null, "runs": 773, "suggest": { "input": [ "visualizing_soil", "Binarized version of the original data set (see version 1). It converts the numeric target feature to a two-class nominal target feature by computing the mean and classifying all instances with a lower target value as positive ('P') and all others as negative ('N'). " ], "weight": 5 }, "qualities": { "NumberOfInstances": 8641, "NumberOfFeatures": 5, "NumberOfClasses": 2, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 3, "NumberOfSymbolicFeatures": 2, "REPTreeDepth3Kappa": 0.999766196987142, "DecisionStumpKappa": 0.7693068439085066, "MaxMeansOfNumericAtts": 50.91380048605486, "MinMutualInformation": 0.25356456681769, "Quartile2SkewnessOfNumericAtts": 0.18800212060082225, "RandomTreeDepth1AUC": 0.9998948032821375, "Dimensionality": 0.0005786367318597385, "MaxMutualInformation": 0.25356456681769, "MinNominalAttDistinctValues": 2, "PercentageOfBinaryFeatures": 40, "Quartile2StdDevOfNumericAtts": 1.1072790823234426, "RandomTreeDepth1ErrRate": 0.0001157273463719477, "EquivalentNumberOfAtts": 3.9152133195034593, "MaxNominalAttDistinctValues": 2, "MinSkewnessOfNumericAtts": 0.018177729437555933, "PercentageOfInstancesWithMissingValues": 0, "Quartile3AttributeEntropy": 0.797754775489027, "RandomTreeDepth1Kappa": 0.9997662079307864, "J48.00001.AUC": 0.9998713991769548, "MaxSkewnessOfNumericAtts": 0.5615952184002584, "MinStdDevOfNumericAtts": 0.42907735828339694, "PercentageOfMissingValues": 0, "Quartile3KurtosisOfNumericAtts": -0.007288159544537098, "AutoCorrelation": 0.9994212962962963, "RandomTreeDepth2AUC": 0.9998948032821375, "J48.00001.ErrRate": 0.0001157273463719477, "MaxStdDevOfNumericAtts": 28.81016651712464, "MinorityClassPercentage": 44.99479226941327, "PercentageOfNumericFeatures": 60, "Quartile3MeansOfNumericAtts": 50.91380048605486, "CfsSubsetEval_DecisionStumpAUC": 0.9998713991769548, "RandomTreeDepth2ErrRate": 0.0001157273463719477, "J48.00001.Kappa": 0.999766196987142, "MeanAttributeEntropy": 0.797754775489027, "MinorityClassSize": 3888, "PercentageOfSymbolicFeatures": 40, "Quartile3MutualInformation": 0.25356456681769, "CfsSubsetEval_DecisionStumpErrRate": 0.0001157273463719477, "RandomTreeDepth2Kappa": 0.9997662079307864, "J48.0001.AUC": 0.9998713991769548, "MeanKurtosisOfNumericAtts": -0.7889207845004848, "NaiveBayesAUC": 0.9996792149467653, "Quartile1AttributeEntropy": 0.797754775489027, "Quartile3SkewnessOfNumericAtts": 0.5615952184002584, "CfsSubsetEval_DecisionStumpKappa": 0.999766196987142, "RandomTreeDepth3AUC": 0.9998948032821375, "J48.0001.ErrRate": 0.0001157273463719477, "MeanMeansOfNumericAtts": 17.852376846815574, "NaiveBayesErrRate": 0.05323457933109594, "Quartile1KurtosisOfNumericAtts": -1.2645122468220127, "Quartile3StdDevOfNumericAtts": 28.81016651712464, "CfsSubsetEval_NaiveBayesAUC": 0.9998713991769548, "RandomTreeDepth3ErrRate": 0.0001157273463719477, "J48.0001.Kappa": 0.999766196987142, "MeanMutualInformation": 0.25356456681769, "NaiveBayesKappa": 0.8912826927876011, "Quartile1MeansOfNumericAtts": 0.7385423909269762, "REPTreeDepth1AUC": 0.9999487815362876, "CfsSubsetEval_NaiveBayesErrRate": 0.0001157273463719477, "RandomTreeDepth3Kappa": 0.9997662079307864, "J48.001.AUC": 0.9998713991769548, "MeanNoiseToSignalRatio": 2.1461603074163094, "NumberOfBinaryFeatures": 2, "Quartile1MutualInformation": 0.25356456681769, "REPTreeDepth1ErrRate": 0.0001157273463719477, "CfsSubsetEval_NaiveBayesKappa": 0.999766196987142, "CfsSubsetEval_kNN1NAUC": 0.9998713991769548, "StdvNominalAttDistinctValues": 0, "J48.001.ErrRate": 0.0001157273463719477, "MeanNominalAttDistinctValues": 2, "Quartile1SkewnessOfNumericAtts": 0.018177729437555933, "REPTreeDepth1Kappa": 0.999766196987142, "CfsSubsetEval_kNN1NErrRate": 0.0001157273463719477, "kNN1NAUC": 0.9971892616662293, "J48.001.Kappa": 0.999766196987142, "MeanSkewnessOfNumericAtts": 0.2559250228128789, "Quartile1StdDevOfNumericAtts": 0.42907735828339694, "REPTreeDepth2AUC": 0.9999487815362876, "CfsSubsetEval_kNN1NKappa": 0.999766196987142, "kNN1NErrRate": 0.002661728966554797, "MajorityClassPercentage": 55.00520773058673, "MeanStdDevOfNumericAtts": 10.11550765257716, "Quartile2AttributeEntropy": 0.797754775489027, "REPTreeDepth2ErrRate": 0.0001157273463719477, "ClassEntropy": 0.9927593693587449, "kNN1NKappa": 0.9946217754513923, "MajorityClassSize": 4753, "MinAttributeEntropy": 0.797754775489027, "Quartile2KurtosisOfNumericAtts": -1.0949619471349044, "REPTreeDepth2Kappa": 0.999766196987142, "REPTreeDepth3AUC": 0.9999487815362876, "DecisionStumpAUC": 0.8915855829413349, "MaxAttributeEntropy": 0.797754775489027, "MinKurtosisOfNumericAtts": -1.2645122468220127, "Quartile2MeansOfNumericAtts": 1.9047876634648768, "REPTreeDepth3ErrRate": 0.0001157273463719477, "DecisionStumpErrRate": 0.11688461983566717, "MaxKurtosisOfNumericAtts": -0.007288159544537098, "MinMeansOfNumericAtts": 0.7385423909269762, "Quartile2MutualInformation": 0.25356456681769 }, "tags": [ { "uploader": "2", "tag": "binarized_regression_problem" }, { "uploader": "38960", "tag": "Chemistry" }, { "uploader": "38960", "tag": "Life Science" }, { "uploader": "2", "tag": "study_1" }, { "uploader": "1", "tag": "study_41" }, { "uploader": "64", "tag": "study_7" } ], "features": [ { "name": "binaryClass", "index": "4", "type": "nominal", "distinct": "2", "missing": "0", "target": "1", "distr": [ [ "P", "N" ], [ [ "4753", "0" ], [ "0", "3888" ] ] ] }, { "name": "northing", "index": "0", "type": "numeric", "distinct": "7011", "missing": "0", "min": "0", "max": "4", "mean": "2", "stdev": "1" }, { "name": "easting", "index": "1", "type": "numeric", "distinct": "6069", "missing": "0", "min": "0", "max": "2", "mean": "1", "stdev": "0" }, { "name": "resistivity", "index": "2", "type": "numeric", "distinct": "5726", "missing": "0", "min": "1", "max": "166", "mean": "51", "stdev": "29" }, { "name": "isns", "index": "3", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "0", "1" ], [ [ "2665", "3888" ], [ "2088", "0" ] ] ] } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }