{ "data_id": "40509", "name": "Australian", "exact_name": "Australian", "version": 3, "version_label": "2", "description": "**Author**: Confidential. Donated by Ross Quinlan \r\n**Source**: [LibSVM](https:\/\/www.csie.ntu.edu.tw\/~cjlin\/libsvmtools\/datasets\/binary.html), [UCI](https:\/\/archive.ics.uci.edu\/ml\/datasets\/Statlog+(Australian+Credit+Approval)) - 1987 \r\n**Please cite**: [UCI](https:\/\/archive.ics.uci.edu\/ml\/citation_policy.html) \r\n\r\n**Australian Credit Approval**. This is the famous Australian Credit Approval dataset, originating from the StatLog project. It concerns credit card applications. All attribute names and values have been changed to meaningless symbols to protect the confidentiality of the data. \r\n\r\nThis dataset was retrieved 2014-11-14 from the libSVM site. It was normalized to [-1,1] and converted to the ARFF format.\r\n\r\n### Feature information\r\n\r\nThere are 6 numerical and 8 categorical attributes, all normalized to [-1,1]. The original formatting was as follows: \r\n\r\nA1: 0,1 CATEGORICAL (formerly: a,b) \r\nA2: continuous. \r\nA3: continuous. \r\nA4: 1,2,3 CATEGORICAL (formerly: p,g,gg) \r\nA5: 1, 2,3,4,5, 6,7,8,9,10,11,12,13,14 CATEGORICAL (formerly: ff,d,i,k,j,aa,m,c,w, e, q, r,cc, x) \r\nA6: 1, 2,3, 4,5,6,7,8,9 CATEGORICAL (formerly: ff,dd,j,bb,v,n,o,h,z) \r\nA7: continuous. \r\nA8: 1, 0 CATEGORICAL (formerly: t, f) \r\nA9: 1, 0 CATEGORICAL (formerly: t, f) \r\nA10: continuous. \r\nA11: 1, 0 CATEGORICAL (formerly: t, f) \r\nA12: 1, 2, 3 CATEGORICAL (formerly: s, g, p) \r\nA13: continuous. \r\nA14: continuous. \r\nA15: 1,2 class attribute (formerly: +,-) \r\n\r\n### Relevant Papers\r\n\r\nRoss Quinlan. \"Simplifying decision trees\", Int J Man-Machine Studies 27, Dec 1987, pp. 221-234. \r\n\r\nRoss Quinlan. \"C4.5: Programs for Machine Learning\", Morgan Kaufmann, Oct 1992 ", "format": "ARFF", "uploader": "Joaquin Vanschoren", "uploader_id": 2, "visibility": "public", "creator": null, "contributor": null, "date": "2016-09-21 15:43:02", "update_comment": null, "last_update": "2016-09-21 15:43:02", "licence": "Public", "status": "deactivated", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/4599631\/phpjP8PU3", "default_target_attribute": "Y", "row_id_attribute": null, "ignore_attribute": null, "runs": 208613, "suggest": { "input": [ "Australian", "This dataset was retrieved 2014-11-14 from the libSVM site. It was normalized to [-1,1] and converted to the ARFF format. ### Feature information There are 6 numerical and 8 categorical attributes, all normalized to [-1,1]. The original formatting was as follows: A1: 0,1 CATEGORICAL (formerly: a,b) A2: continuous. A3: continuous. A4: 1,2,3 CATEGORICAL (formerly: p,g,gg) A5: 1, 2,3,4,5, 6,7,8,9,10,11,12,13,14 CATEGORICAL (formerly: ff,d,i,k,j,aa,m,c,w, e, q, r,cc, x) A6: 1, 2,3, 4,5,6,7,8,9 CATEG " ], "weight": 5 }, "qualities": { "NumberOfInstances": 690, "NumberOfFeatures": 15, "NumberOfClasses": 2, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 14, "NumberOfSymbolicFeatures": 1, "ClassEntropy": 0.9912308989033523, "MeanNoiseToSignalRatio": null, "Quartile2AttributeEntropy": null, "Dimensionality": 0.021739130434782608, "MeanNominalAttDistinctValues": 2, "Quartile2KurtosisOfNumericAtts": 0.5069628352788187, "EquivalentNumberOfAtts": null, "MeanSkewnessOfNumericAtts": 1.6774974008065446, "Quartile2MeansOfNumericAtts": -0.18913043478260885, "MajorityClassPercentage": 55.507246376811594, "MeanStdDevOfNumericAtts": 0.5060005412827685, "Quartile2MutualInformation": null, "MajorityClassSize": 383, "MinAttributeEntropy": null, "Quartile2SkewnessOfNumericAtts": 0.38099919060115417, "MaxAttributeEntropy": null, "MinKurtosisOfNumericAtts": -1.9971378336902383,
"PercentageOfBinaryFeatures": 6.666666666666667, "Quartile2StdDevOfNumericAtts": 0.39327614078162537, "MaxKurtosisOfNumericAtts": 214.6699724275264, "MinMeansOfNumericAtts": -0.9796522898550725, "PercentageOfInstancesWithMissingValues": 0, "Quartile3AttributeEntropy": null, "MaxMeansOfNumericAtts": 0.3565217391304348, "MinMutualInformation": null, "PercentageOfMissingValues": 0, "Quartile3KurtosisOfNumericAtts": 13.381823553347559, "MaxMutualInformation": null, "MinNominalAttDistinctValues": 2, "PercentageOfNumericFeatures": 93.33333333333333, "Quartile3MeansOfNumericAtts": -0.05816611630434777, "MaxNominalAttDistinctValues": 2, "MinSkewnessOfNumericAtts": -1.9447254706547883, "PercentageOfSymbolicFeatures": 6.666666666666667, "Quartile3MutualInformation": null, "MaxSkewnessOfNumericAtts": 13.140655014445555, "MinStdDevOfNumericAtts": 0.10420205196605362, "Quartile1AttributeEntropy": null, "Quartile3SkewnessOfNumericAtts": 2.7852666666708323, "MaxStdDevOfNumericAtts": 0.9996486625400516, "MinorityClassPercentage": 44.492753623188406, "Quartile1KurtosisOfNumericAtts": -1.544179019410057, "Quartile3StdDevOfNumericAtts": 0.9487635976176738, "MeanAttributeEntropy": null, "MinorityClassSize": 307, "Quartile1MeansOfNumericAtts": -0.8229820112318841, "StdvNominalAttDistinctValues": 0, "MeanKurtosisOfNumericAtts": 21.295222015029267, "NumberOfBinaryFeatures": 1, "Quartile1MutualInformation": null, "MeanMeansOfNumericAtts": -0.35136002080745343, "Quartile1SkewnessOfNumericAtts": -0.2610067256377514, "AutoCorrelation": 0.5195936139332366, "MeanMutualInformation": null, "Quartile1StdDevOfNumericAtts": 0.21917208085894788 }, "tags": [ { "tag": "study_123", "uploader": "3886" }, { "tag": "study_14", "uploader": "2" }, { "tag": "uci", "uploader": "2" } ], "features": [ { "name": "Y", "index": "0", "type": "nominal", "distinct": "2", "missing": "0", "target": "1", "distr": [ [ "-1", "1" ], [ [ "383", "0" ], [ "0", "307" ] ] ] }, { "name": "X1", "index": "1", "type": "numeric", 
"distinct": "2", "missing": "0", "min": "-1", "max": "1", "mean": "0", "stdev": "1" }, { "name": "X2", "index": "2", "type": "numeric", "distinct": "350", "missing": "0", "min": "-1", "max": "1", "mean": "0", "stdev": "0" }, { "name": "X3", "index": "3", "type": "numeric", "distinct": "215", "missing": "0", "min": "-1", "max": "1", "mean": "-1", "stdev": "0" }, { "name": "X4", "index": "4", "type": "numeric", "distinct": "3", "missing": "0", "min": "-1", "max": "1", "mean": "0", "stdev": "0" }, { "name": "X5", "index": "5", "type": "numeric", "distinct": "14", "missing": "0", "min": "-1", "max": "1", "mean": "0", "stdev": "1" }, { "name": "X6", "index": "6", "type": "numeric", "distinct": "8", "missing": "0", "min": "-1", "max": "1", "mean": "0", "stdev": "0" }, { "name": "X7", "index": "7", "type": "numeric", "distinct": "132", "missing": "0", "min": "-1", "max": "1", "mean": "-1", "stdev": "0" }, { "name": "X8", "index": "8", "type": "numeric", "distinct": "2", "missing": "0", "min": "-1", "max": "1", "mean": "0", "stdev": "1" }, { "name": "X9", "index": "9", "type": "numeric", "distinct": "2", "missing": "0", "min": "-1", "max": "1", "mean": "0", "stdev": "1" }, { "name": "X10", "index": "10", "type": "numeric", "distinct": "23", "missing": "0", "min": "-1", "max": "1", "mean": "-1", "stdev": "0" }, { "name": "X11", "index": "11", "type": "numeric", "distinct": "2", "missing": "0", "min": "-1", "max": "1", "mean": "0", "stdev": "1" }, { "name": "X12", "index": "12", "type": "numeric", "distinct": "3", "missing": "0", "min": "-1", "max": "1", "mean": "0", "stdev": "0" }, { "name": "X13", "index": "13", "type": "numeric", "distinct": "171", "missing": "0", "min": "-1", "max": "1", "mean": "-1", "stdev": "0" }, { "name": "X14", "index": "14", "type": "numeric", "distinct": "240", "missing": "0", "min": "-1", "max": "1", "mean": "-1", "stdev": "0" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, 
"reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }