{ "data_id": "29", "name": "credit-approval", "exact_name": "credit-approval", "version": 1, "version_label": "1", "description": "**Author**: Confidential - Donated by Ross Quinlan \r\n**Source**: [UCI](http:\/\/archive.ics.uci.edu\/ml\/datasets\/credit+approval) - 1987 \r\n**Please cite**: [UCI](http:\/\/archive.ics.uci.edu\/ml\/citation_policy.html) \r\n\r\n**Credit Approval**\r\nThis file concerns credit card applications. All attribute names and values have been changed to meaningless symbols to protect the confidentiality of the data. \r\n \r\nThis dataset is interesting because there is a good mix of attributes -- continuous, nominal with small numbers of values, and nominal with larger numbers of values. There are also a few missing values.", "format": "ARFF", "uploader": "Jan van Rijn", "uploader_id": 1, "visibility": "public", "creator": null, "contributor": null, "date": "2014-04-06 23:21:38", "update_comment": null, "last_update": "2014-04-06 23:21:38", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/29\/dataset_29_credit-a.arff", "default_target_attribute": "class", "row_id_attribute": null, "ignore_attribute": null, "runs": 25384, "suggest": { "input": [ "credit-approval", "This file concerns credit card applications. All attribute names and values have been changed to meaningless symbols to protect the confidentiality of the data. This dataset is interesting because there is a good mix of attributes -- continuous, nominal with small numbers of values, and nominal with larger numbers of values. There are also a few missing values. " ], "weight": 5 }, "qualities": { "NumberOfInstances": 690, "NumberOfFeatures": 16, "NumberOfClasses": 2, "NumberOfMissingValues": 67, "NumberOfInstancesWithMissingValues": 37, "NumberOfNumericFeatures": 6, "NumberOfSymbolicFeatures": 10, "Quartile2AttributeEntropy": 0.9847953334568664, "REPTreeDepth2ErrRate": 0.14492753623188406, "CfsSubsetEval_kNN1NKappa": 0.7101750574897961, "kNN1NErrRate": 0.1782608695652174, "MajorityClassPercentage": 55.507246376811594, "MeanStdDevOfNumericAtts": 901.5091409447066, "Quartile2KurtosisOfNumericAtts": 15.348780875597205, "REPTreeDepth2Kappa": 0.7105146127188972, "ClassEntropy": 0.9912308989033523, "kNN1NKappa": 0.6382815496739548, "MajorityClassSize": 383, "MinAttributeEntropy": 0.5010395545266964, "Quartile2MeansOfNumericAtts": 18.163447864563295, "REPTreeDepth3AUC": 0.8857766135685188, "DecisionStumpAUC": 0.8590375996121823, "MaxAttributeEntropy": 3.4964402118046265, "MinKurtosisOfNumericAtts": 1.1192361294529984, "Quartile2MutualInformation": 0.02960326183246, "REPTreeDepth3ErrRate": 0.14492753623188406, "DecisionStumpErrRate": 0.14492753623188406, "MaxKurtosisOfNumericAtts": 214.66997242752777, "MinMeansOfNumericAtts": 2.22340579710145, "Quartile2SkewnessOfNumericAtts": 2.8076616546800306, "REPTreeDepth3Kappa": 0.7105146127188972, "DecisionStumpKappa": 0.7116180318139644, "MaxMeansOfNumericAtts": 1017.3855072463792, "MinMutualInformation": 0.0006029571694, "PercentageOfBinaryFeatures": 31.25, "Quartile2StdDevOfNumericAtts": 8.468012873399704, "RandomTreeDepth1AUC": 0.7672209006951606, "Dimensionality": 0.02318840579710145, "MaxMutualInformation": 0.42570942667283, "MinNominalAttDistinctValues": 2, "PercentageOfInstancesWithMissingValues": 5.36231884057971, "Quartile3AttributeEntropy": 1.39388043097786, "RandomTreeDepth1ErrRate": 0.2492753623188406, "EquivalentNumberOfAtts": 10.987754965826467, "MaxNominalAttDistinctValues": 14, "MinSkewnessOfNumericAtts": 1.1458915555559273, "PercentageOfMissingValues": 0.6068840579710145, "Quartile3KurtosisOfNumericAtts": 91.78956656083423, "AutoCorrelation": 0.9782293178519593, "RandomTreeDepth1Kappa": 0.49105006303980503, "J48.00001.AUC": 0.8928568391151631, "MaxSkewnessOfNumericAtts": 13.140655014445356, "MinStdDevOfNumericAtts": 3.3465133592781324, "PercentageOfNumericFeatures": 37.5, "Quartile3MeansOfNumericAtts": 392.35745509815314, "CfsSubsetEval_DecisionStumpAUC": 0.8776120291543702, "RandomTreeDepth2AUC": 0.7672209006951606, "J48.00001.ErrRate": 0.1608695652173913, "MaxStdDevOfNumericAtts": 5210.102598302697, "MinorityClassPercentage": 44.492753623188406, "PercentageOfSymbolicFeatures": 62.5, "Quartile3MutualInformation": 0.13272286566341002, "CfsSubsetEval_DecisionStumpErrRate": 0.14347826086956522, "RandomTreeDepth2ErrRate": 0.2492753623188406, "J48.00001.Kappa": 0.6739935471238732, "MeanAttributeEntropy": 1.2537639123535842, "MinorityClassSize": 307, "Quartile1AttributeEntropy": 0.8162006158245964, "Quartile3SkewnessOfNumericAtts": 7.149553646695756, "CfsSubsetEval_DecisionStumpKappa": 0.7101750574897961, "RandomTreeDepth2Kappa": 0.49105006303980503, "J48.0001.AUC": 0.8928568391151631, "MeanKurtosisOfNumericAtts": 49.931703911167034, "NaiveBayesAUC": 0.8940115780808026, "Quartile1KurtosisOfNumericAtts": 1.9853254475312268, "Quartile3StdDevOfNumericAtts": 1432.8807257446028, "CfsSubsetEval_NaiveBayesAUC": 0.8776120291543702, "RandomTreeDepth3AUC": 0.7672209006951606, "J48.0001.ErrRate": 0.1608695652173913, "MeanMeansOfNumericAtts": 207.0584299702253, "NaiveBayesErrRate": 0.21594202898550724, "Quartile1MeansOfNumericAtts": 2.355851449275366, "REPTreeDepth1AUC": 0.8857766135685188, "CfsSubsetEval_NaiveBayesErrRate": 0.14347826086956522, "RandomTreeDepth3ErrRate": 0.2492753623188406, "J48.0001.Kappa": 0.6739935471238732, "MeanMutualInformation": 0.09021232289819223, "NaiveBayesKappa": 0.5492647768025463, "Quartile1MutualInformation": 0.005378837210200001, "REPTreeDepth1ErrRate": 0.14492753623188406, "CfsSubsetEval_NaiveBayesKappa": 0.7101750574897961, "RandomTreeDepth3Kappa": 0.49105006303980503, "J48.001.AUC": 0.8928568391151631, "MeanNoiseToSignalRatio": 12.897922945277674, "NumberOfBinaryFeatures": 5, "Quartile1SkewnessOfNumericAtts": 1.403082732387671, "REPTreeDepth1Kappa": 0.7105146127188972, "CfsSubsetEval_kNN1NAUC": 0.8776120291543702, "StdvNominalAttDistinctValues": 4.049691346263318, "J48.001.ErrRate": 0.1608695652173913, "MeanNominalAttDistinctValues": 4.2, "Quartile1StdDevOfNumericAtts": 4.48383336548978, "REPTreeDepth2AUC": 0.8857766135685188, "CfsSubsetEval_kNN1NErrRate": 0.14347826086956522, "kNN1NAUC": 0.8184187921517933, "J48.001.Kappa": 0.6739935471238732, "MeanSkewnessOfNumericAtts": 4.423867143578692 }, "tags": [ { "uploader": "38960", "tag": "Machine Learning" }, { "uploader": "1", "tag": "mythbusting_1" }, { "uploader": "1", "tag": "OpenML-CC18" }, { "uploader": "348", "tag": "OpenML100" }, { "uploader": "38960", "tag": "Statistics" }, { "uploader": "2", "tag": "study_1" }, { "uploader": "3886", "tag": "study_123" }, { "uploader": "5824", "tag": "study_135" }, { "uploader": "64", "tag": "study_14" }, { "uploader": "5824", "tag": "study_144" }, { "uploader": "939", "tag": "study_15" }, { "uploader": "939", "tag": "study_20" }, { "uploader": "1", "tag": "study_34" }, { "uploader": "1", "tag": "study_37" }, { "uploader": "1", "tag": "study_41" }, { "uploader": "1856", "tag": "study_70" }, { "uploader": "1935", "tag": "study_98" }, { "uploader": "1", "tag": "study_99" }, { "uploader": "1", "tag": "uci" } ], "features": [ { "name": "class", "index": "15", "type": "nominal", "distinct": "2", "missing": "0", "target": "1", "distr": [ [ "+", "-" ], [ [ "307", "0" ], [ "0", "383" ] ] ] }, { "name": "A1", "index": "0", "type": "nominal", "distinct": "2", "missing": "12", "distr": [ [ "b", "a" ], [ [ "206", "262" ], [ "98", "112" ] ] ] }, { "name": "A2", "index": "1", "type": "numeric", "distinct": "349", "missing": "12", "min": "14", "max": "80", "mean": "32", "stdev": "12" }, { "name": "A3", "index": "2", "type": "numeric", "distinct": "215", "missing": "0", "min": "0", "max": "28", "mean": "5", "stdev": "5" }, { "name": "A4", "index": "3", "type": "nominal", "distinct": "3", "missing": "6", "distr": [ [ "u", "y", "l", "t" ], [ [ "256", "263" ], [ "45", "118" ], [ "2", "0" ], [ "0", "0" ] ] ] }, { "name": "A5", "index": "4", "type": "nominal", "distinct": "3", "missing": "6", "distr": [ [ "g", "p", "gg" ], [ [ "256", "263" ], [ "45", "118" ], [ "2", "0" ] ] ] }, { "name": "A6", "index": "5", "type": "nominal", "distinct": "14", "missing": "9", "distr": [ [ "c", "d", "cc", "i", "j", "k", "m", "r", "q", "w", "x", "e", "aa", "ff" ], [ [ "62", "75" ], [ "7", "23" ], [ "29", "12" ], [ "14", "45" ], [ "3", "7" ], [ "14", "37" ], [ "16", "22" ], [ "2", "1" ], [ "51", "27" ], [ "33", "31" ], [ "32", "6" ], [ "14", "11" ], [ "19", "35" ], [ "7", "46" ] ] ] }, { "name": "A7", "index": "6", "type": "nominal", "distinct": "9", "missing": "9", "distr": [ [ "v", "h", "bb", "j", "n", "z", "dd", "ff", "o" ], [ [ "169", "230" ], [ "87", "51" ], [ "25", "34" ], [ "3", "5" ], [ "2", "2" ], [ "6", "2" ], [ "2", "4" ], [ "8", "49" ], [ "1", "1" ] ] ] }, { "name": "A8", "index": "7", "type": "numeric", "distinct": "132", "missing": "0", "min": "0", "max": "29", "mean": "2", "stdev": "3" }, { "name": "A9", "index": "8", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "t", "f" ], [ [ "284", "77" ], [ "23", "306" ] ] ] }, { "name": "A10", "index": "9", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "t", "f" ], [ [ "209", "86" ], [ "98", "297" ] ] ] }, { "name": "A11", "index": "10", "type": "numeric", "distinct": "23", "missing": "0", "min": "0", "max": "67", "mean": "2", "stdev": "5" }, { "name": "A12", "index": "11", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "t", "f" ], [ [ "146", "170" ], [ "161", "213" ] ] ] }, { "name": "A13", "index": "12", "type": "nominal", "distinct": "3", "missing": "0", "distr": [ [ "g", "p", "s" ], [ [ "287", "338" ], [ "5", "3" ], [ "15", "42" ] ] ] }, { "name": "A14", "index": "13", "type": "numeric", "distinct": "170", "missing": "13", "min": "0", "max": "2000", "mean": "184", "stdev": "174" }, { "name": "A15", "index": "14", "type": "numeric", "distinct": "240", "missing": "0", "min": "0", "max": "100000", "mean": "1017", "stdev": "5210" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }