{ "data_id": "750", "name": "pm10", "exact_name": "pm10", "version": 2, "version_label": null, "description": "**Author**: \n**Source**: Unknown - Date unknown \n**Please cite**: \n\nBinarized version of the original data set (see version 1). It converts the numeric target feature to a two-class nominal target feature by computing the mean and classifying all instances with a lower target value as positive ('P') and all others as negative ('N').", "format": "ARFF", "uploader": "Joaquin Vanschoren", "uploader_id": 2, "visibility": "public", "creator": null, "contributor": null, "date": "2014-10-04 14:32:27", "update_comment": null, "last_update": "2014-10-04 14:32:27", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/53284\/pm10.arff", "default_target_attribute": "binaryClass", "row_id_attribute": null, "ignore_attribute": null, "runs": 758, "suggest": { "input": [ "pm10", "Binarized version of the original data set (see version 1). It converts the numeric target feature to a two-class nominal target feature by computing the mean and classifying all instances with a lower target value as positive ('P') and all others as negative ('N'). " ], "weight": 5 }, "qualities": { "NumberOfInstances": 500, "NumberOfFeatures": 8, "NumberOfClasses": 2, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 7, "NumberOfSymbolicFeatures": 1, "REPTreeDepth3Kappa": 0.09298144223977406, "DecisionStumpKappa": 0.04791747011183955, "MaxMeansOfNumericAtts": 141.091, "MinMutualInformation": null, "Quartile2SkewnessOfNumericAtts": -0.07115678624409269, "RandomTreeDepth1AUC": 0.5344888291402599, "Dimensionality": 0.016, "MaxMutualInformation": null, "MinNominalAttDistinctValues": 2, "PercentageOfBinaryFeatures": 12.5, "Quartile2StdDevOfNumericAtts": 1.860612349908832, "RandomTreeDepth1ErrRate": 0.466, "EquivalentNumberOfAtts": null, "MaxNominalAttDistinctValues": 2, "MinSkewnessOfNumericAtts": -0.913561198200657, "PercentageOfInstancesWithMissingValues": 0, "Quartile3AttributeEntropy": null, "RandomTreeDepth1Kappa": 0.06889386189258313, "J48.00001.AUC": 0.5231899366237756, "MaxSkewnessOfNumericAtts": 0.8238986439770583, "MinStdDevOfNumericAtts": 0.8868084438818452, "PercentageOfMissingValues": 0, "Quartile3KurtosisOfNumericAtts": 0.5937842101601292, "AutoCorrelation": 0.5170340681362725, "RandomTreeDepth2AUC": 0.5344888291402599, "J48.00001.ErrRate": 0.48, "MaxStdDevOfNumericAtts": 85.51077361249645, "MinorityClassPercentage": 49.2, "PercentageOfNumericFeatures": 87.5, "Quartile3MeansOfNumericAtts": 12.446000000000002, "CfsSubsetEval_DecisionStumpAUC": 0.5, "RandomTreeDepth2ErrRate": 0.466, "J48.00001.Kappa": 0.031195504747142076, "MeanAttributeEntropy": null, "MinorityClassSize": 246, "PercentageOfSymbolicFeatures": 12.5, "Quartile3MutualInformation": null, "CfsSubsetEval_DecisionStumpErrRate": 0.492, "RandomTreeDepth2Kappa": 0.06889386189258313, "J48.0001.AUC": 0.5231899366237756, "MeanKurtosisOfNumericAtts": 0.4989987534076391, "NaiveBayesAUC": 0.5101626016260162, "Quartile1AttributeEntropy": null, "Quartile3SkewnessOfNumericAtts": 0.4614759955514295, "CfsSubsetEval_DecisionStumpKappa": 0, "RandomTreeDepth3AUC": 0.5344888291402599, "J48.0001.ErrRate": 0.48, "MeanMeansOfNumericAtts": 23.99629007714286, "NaiveBayesErrRate": 0.482, "Quartile1KurtosisOfNumericAtts": -1.0026531251028858, "Quartile3StdDevOfNumericAtts": 6.857487460326632, "CfsSubsetEval_NaiveBayesAUC": 0.5, "RandomTreeDepth3ErrRate": 0.466, "J48.0001.Kappa": 0.031195504747142076, "MeanMutualInformation": null, "NaiveBayesKappa": 0.032843200205470754, "Quartile1MeansOfNumericAtts": 0.787, "REPTreeDepth1AUC": 0.5453716151334743, "CfsSubsetEval_NaiveBayesErrRate": 0.492, "RandomTreeDepth3Kappa": 0.06889386189258313, "J48.001.AUC": 0.5231899366237756, "MeanNoiseToSignalRatio": null, "NumberOfBinaryFeatures": 1, "Quartile1MutualInformation": null, "REPTreeDepth1ErrRate": 0.452, "CfsSubsetEval_NaiveBayesKappa": 0, "CfsSubsetEval_kNN1NAUC": 0.5, "StdvNominalAttDistinctValues": 0, "J48.001.ErrRate": 0.48, "MeanNominalAttDistinctValues": 2, "Quartile1SkewnessOfNumericAtts": -0.3071873540507745, "REPTreeDepth1Kappa": 0.09298144223977406, "CfsSubsetEval_kNN1NErrRate": 0.492, "kNN1NAUC": 0.555886306894565, "J48.001.Kappa": 0.031195504747142076, "MeanSkewnessOfNumericAtts": -0.0456230691517487, "Quartile1StdDevOfNumericAtts": 0.9886312474765178, "REPTreeDepth2AUC": 0.5453716151334743, "CfsSubsetEval_kNN1NKappa": 0, "kNN1NErrRate": 0.444, "MajorityClassPercentage": 50.8, "MeanStdDevOfNumericAtts": 14.79787251097422, "Quartile2AttributeEntropy": null, "REPTreeDepth2ErrRate": 0.452, "ClassEntropy": 0.9998153271549207, "kNN1NKappa": 0.11177261378913009, "MajorityClassSize": 254, "MinAttributeEntropy": null, "Quartile2KurtosisOfNumericAtts": 0.27107031541788507, "REPTreeDepth2Kappa": 0.09298144223977406, "REPTreeDepth3AUC": 0.5453716151334743, "DecisionStumpAUC": 0.5263827539850201, "MaxAttributeEntropy": null, "MinKurtosisOfNumericAtts": -1.1673149165628454, "Quartile2MeansOfNumericAtts": 3.27092914, "REPTreeDepth3ErrRate": 0.452, "DecisionStumpErrRate": 0.474, "MaxKurtosisOfNumericAtts": 4.622818194317764, "MinMeansOfNumericAtts": 0.1548, "Quartile2MutualInformation": null }, "tags": [ { "uploader": "2", "tag": "binarized_regression_problem" }, { "uploader": "38960", "tag": "Chemistry" }, { "uploader": "38960", "tag": "Life Science" }, { "uploader": "1", "tag": "mythbusting_1" }, { "uploader": "2", "tag": "study_1" }, { "uploader": "939", "tag": "study_15" }, { "uploader": "939", "tag": "study_20" }, { "uploader": "1", "tag": "study_41" }, { "uploader": "64", "tag": "study_7" }, { "uploader": "4209", "tag": "study_88" } ], "features": [ { "name": "binaryClass", "index": "7", "type": "nominal", "distinct": "2", "missing": "0", "target": "1", "distr": [ [ "P", "N" ], [ [ "254", "0" ], [ "0", "246" ] ] ] }, { "name": "pm10_concentration", "index": "0", "type": "numeric", "distinct": "117", "missing": "0", "min": "1", "max": "5", "mean": "3", "stdev": "1" }, { "name": "cars_per_hour", "index": "1", "type": "numeric", "distinct": "456", "missing": "0", "min": "4", "max": "8", "mean": "7", "stdev": "1" }, { "name": "temperature_at_2m", "index": "2", "type": "numeric", "distinct": "218", "missing": "0", "min": "-19", "max": "22", "mean": "1", "stdev": "6" }, { "name": "wind_speed", "index": "3", "type": "numeric", "distinct": "79", "missing": "0", "min": "0", "max": "10", "mean": "3", "stdev": "2" }, { "name": "temperature_diff_2m_25m", "index": "4", "type": "numeric", "distinct": "62", "missing": "0", "min": "-5", "max": "4", "mean": "0", "stdev": "1" }, { "name": "wind_direction", "index": "5", "type": "numeric", "distinct": "354", "missing": "0", "min": "5", "max": "358", "mean": "141", "stdev": "86" }, { "name": "hour_of_day", "index": "6", "type": "numeric", "distinct": "24", "missing": "0", "min": "1", "max": "24", "mean": "12", "stdev": "7" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }