{ "data_id": "45553", "name": "FICO-HELOC-cleaned", "exact_name": "FICO-HELOC-cleaned", "version": 1, "version_label": null, "description": "This dataset is from the \"Explainable Machine Learning Challenge\":\n\n> The Explainable Machine Learning Challenge is a collaboration between Google, FICO and academics at Berkeley, Oxford, Imperial, UC Irvine and MIT, to generate new research in the area of algorithmic explainability. Teams will be challenged to create machine learning models with both high accuracy and explainability; they will use a real-world financial dataset provided by FICO. Designers and end users of machine learning algorithms will both benefit from more interpretable and explainable algorithms. Machine learning model designers will benefit from Model explanations, written explanations describing the functioning of a trained model. These might include information about which variables or examples are particularly important, they might explain the logic used by an algorithm, and\/or characterize input\/output relationships between variables and predictions. We expect teams to tell the story of their model such that these explanations will be qualitatively evaluated by data scientists at FICO.\n\nFurther information can be retrieved from the [FICO website](https:\/\/community.fico.com\/s\/explainable-machine-learning-challenge).\n\n**Notes**\n* We have obtained the dataset from [Kaggle](https:\/\/www.kaggle.com\/datasets\/averkiyoliabev\/home-equity-line-of-creditheloc)\n* This is a cleaned version of the Kaggle dataset, in which we have removed all rows that only contained `-9`, a special value according to the FAQ.\n* Please request access to the data on the FICO website to obtain the full description of the features.\n* In this version we have encoded the special values (-9, -8, -7) as missing values to make the data more amenable to non-tree models.", "format": "arff", "uploader": "Matthias Feurer", "uploader_id": 86, "visibility": "public", "creator": null, "contributor": null, "date": "2023-06-04 17:23:16", "update_comment": null, "last_update": "2023-06-04 17:23:16", "licence": "Unknown (Kaggle)\/Custom (FICO website)", "status": "active", "error_message": null, "url": "https:\/\/api.openml.org\/data\/download\/22116521\/dataset", "default_target_attribute": "RiskPerformance", "row_id_attribute": null, "ignore_attribute": null, "runs": 0, "suggest": { "input": [ "FICO-HELOC-cleaned", "This dataset is from the \"Explainable Machine Learning Challenge\": > The Explainable Machine Learning Challenge is a collaboration between Google, FICO and academics at Berkeley, Oxford, Imperial, UC Irvine and MIT, to generate new research in the area of algorithmic explainability. Teams will be challenged to create machine learning models with both high accuracy and explainability; they will use a real-world financial dataset provided by FICO. Designers and end users of machine learning algori " ], "weight": 5 }, "qualities": { "NumberOfInstances": 9871, "NumberOfFeatures": 24, "NumberOfClasses": 2, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 21, "NumberOfSymbolicFeatures": 3, "PercentageOfBinaryFeatures": 4.166666666666666, "PercentageOfInstancesWithMissingValues": 0, "AutoCorrelation": 0.5592705167173252, "PercentageOfMissingValues": 0, "Dimensionality": 0.002431364603383649, "PercentageOfNumericFeatures": 87.5, "MajorityClassPercentage": 52.03120251241009, "PercentageOfSymbolicFeatures": 12.5, "MajorityClassSize": 5136, "MinorityClassPercentage": 47.96879748758991, "MinorityClassSize": 4735, "NumberOfBinaryFeatures": 1 }, "tags": [ { "uploader": "38960", "tag": "Chemistry" }, { "uploader": "38960", "tag": "Life Science" } ], "features": [ { "name": "RiskPerformance", "index": "0", "type": "nominal", "distinct": "2", "missing": "0", "target": "1", "distr": [ [ "Bad", "Good" ], [ [ "5136", "0" ], [ "0", "4735" ] ] ] }, { "name": "ExternalRiskEstimate", "index": "1", "type": "numeric", "distinct": "61", "missing": "0", "min": "-9", "max": "94", "mean": "72", "stdev": "10" }, { "name": "MSinceOldestTradeOpen", "index": "2", "type": "numeric", "distinct": "525", "missing": "0", "min": "-8", "max": "803", "mean": "196", "stdev": "102" }, { "name": "MSinceMostRecentTradeOpen", "index": "3", "type": "numeric", "distinct": "111", "missing": "0", "min": "0", "max": "383", "mean": "10", "stdev": "13" }, { "name": "AverageMInFile", "index": "4", "type": "numeric", "distinct": "236", "missing": "0", "min": "4", "max": "383", "mean": "79", "stdev": "34" }, { "name": "NumSatisfactoryTrades", "index": "5", "type": "numeric", "distinct": "73", "missing": "0", "min": "0", "max": "79", "mean": "21", "stdev": "11" }, { "name": "NumTrades60Ever2DerogPubRec", "index": "6", "type": "numeric", "distinct": "18", "missing": "0", "min": "0", "max": "19", "mean": "1", "stdev": "1" }, { "name": "NumTrades90Ever2DerogPubRec", "index": "7", "type": "numeric", "distinct": "16", "missing": "0", "min": "0", "max": "19", "mean": "0", "stdev": "1" }, { "name": "PercentTradesNeverDelq", "index": "8", "type": "numeric", "distinct": "71", "missing": "0", "min": "0", "max": "100", "mean": "92", "stdev": "12" }, { "name": "MSinceMostRecentDelq", "index": "9", "type": "numeric", "distinct": "86", "missing": "0", "min": "-8", "max": "83", "mean": "8", "stdev": "21" }, { "name": "MaxDelq2PublicRecLast12M", "index": "10", "type": "nominal", "distinct": "9", "missing": "0", "distr": [ [ "-9", "0", "1", "2", "3", "4", "5", "6", "7", "9" ], [ [ "0", "0" ], [ "245", "91" ], [ "34", "20" ], [ "38", "15" ], [ "156", "68" ], [ "1178", "434" ], [ "171", "65" ], [ "1698", "1429" ], [ "1612", "2611" ], [ "4", "2" ] ] ] }, { "name": "MaxDelqEver", "index": "11", "type": "nominal", "distinct": "7", "missing": "0", "distr": [ [ "-9", "2", "3", "4", "5", "6", "7", "8" ], [ [ "0", "0" ], [ "517", "222" ], [ "194", "117" ], [ "216", "105" ], [ "635", "333" ], [ "1714", "1154" ], [ "56", "76" ], [ "1804", "2728" ] ] ] }, { "name": "NumTotalTrades", "index": "12", "type": "numeric", "distinct": "87", "missing": "0", "min": "0", "max": "104", "mean": "23", "stdev": "13" }, { "name": "NumTradesOpeninLast12M", "index": "13", "type": "numeric", "distinct": "18", "missing": "0", "min": "0", "max": "19", "mean": "2", "stdev": "2" }, { "name": "PercentInstallTrades", "index": "14", "type": "numeric", "distinct": "95", "missing": "0", "min": "0", "max": "100", "mean": "35", "stdev": "18" }, { "name": "MSinceMostRecentInqexcl7days", "index": "15", "type": "numeric", "distinct": "27", "missing": "0", "min": "-8", "max": "24", "mean": "0", "stdev": "6" }, { "name": "NumInqLast6M", "index": "16", "type": "numeric", "distinct": "26", "missing": "0", "min": "0", "max": "66", "mean": "1", "stdev": "2" }, { "name": "NumInqLast6Mexcl7days", "index": "17", "type": "numeric", "distinct": "26", "missing": "0", "min": "0", "max": "66", "mean": "1", "stdev": "2" }, { "name": "NetFractionRevolvingBurden", "index": "18", "type": "numeric", "distinct": "127", "missing": "0", "min": "-8", "max": "232", "mean": "34", "stdev": "29" }, { "name": "NetFractionInstallBurden", "index": "19", "type": "numeric", "distinct": "138", "missing": "0", "min": "-8", "max": "471", "mean": "42", "stdev": "42" }, { "name": "NumRevolvingTradesWBalance", "index": "20", "type": "numeric", "distinct": "30", "missing": "0", "min": "-8", "max": "32", "mean": "4", "stdev": "3" }, { "name": "NumInstallTradesWBalance", "index": "21", "type": "numeric", "distinct": "19", "missing": "0", "min": "-8", "max": "23", "mean": "2", "stdev": "3" }, { "name": "NumBank2NatlTradesWHighUtilization", "index": "22", "type": "numeric", "distinct": "18", "missing": "0", "min": "-8", "max": "18", "mean": "1", "stdev": "3" }, { "name": "PercentTradesWBalance", "index": "23", "type": "numeric", "distinct": "94", "missing": "0", "min": "-8", "max": "100", "mean": "66", "stdev": "22" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }