{ "data_id": "43682", "name": "Heart-Disease-Dataset-(Comprehensive)", "exact_name": "Heart-Disease-Dataset-(Comprehensive)", "version": 2, "version_label": "v1.0", "description": "Context\nHeart Disease Dataset (Most comprehensive)\nContent\nHeart diseases, also known as cardiovascular diseases (CVDs), are the number 1 cause of death globally, taking an estimated 17.9 million lives each year, which is about 32% of all deaths globally. CVDs are a group of disorders of the heart and blood vessels and include coronary heart disease, cerebrovascular disease, rheumatic heart disease, and other conditions. Four out of 5 CVD deaths are due to heart attacks and strokes, and one-third of these deaths occur prematurely in people under 70 years of age.\nWe have curated this dataset by combining different datasets already available independently but not combined before. We have combined them over 11 common features, which makes it the largest heart disease dataset available for research purposes. The five datasets used for its curation are:\nDatabase: # of instances:\n\nCleveland: 303\nHungarian: 294\nSwitzerland: 123\nLong Beach VA: 200\nStatlog (Heart) Data Set: 270\n\nTotal 1190\nAcknowledgements\nThe dataset is taken from three other research datasets used in different research papers. 
The Nature article listing heart disease databases and names of popular datasets used in various heart disease research is shared below.\nhttps:\/\/www.nature.com\/articles\/s41597-019-0206-3\nInspiration\nCan you find interesting insights from the largest heart disease dataset available so far and build a predictive model which can assist medical practitioners in detecting early-stage heart disease?", "format": "arff", "uploader": "Dustin Carrion", "uploader_id": 30123, "visibility": "public", "creator": null, "contributor": null, "date": "2022-03-24 07:10:44", "update_comment": null, "last_update": "2022-03-24 07:10:44", "licence": "CC0: Public Domain", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/22102507\/dataset", "default_target_attribute": "target", "row_id_attribute": null, "ignore_attribute": null, "runs": 0, "suggest": { "input": [ "Heart-Disease-Dataset-(Comprehensive)", "Context Heart Disease Dataset (Most comprehensive) Content Heart diseases, also known as cardiovascular diseases (CVDs), are the number 1 cause of death globally, taking an estimated 17.9 million lives each year, which is about 32% of all deaths globally. CVDs are a group of disorders of the heart and blood vessels and include coronary heart disease, cerebrovascular disease, rheumatic heart disease, and other conditions. 
Four out of 5 CVD deaths are due to heart attacks and strokes, and one-third o " ], "weight": 5 }, "qualities": { "NumberOfInstances": 1190, "NumberOfFeatures": 12, "NumberOfClasses": 0, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 12, "NumberOfSymbolicFeatures": 0, "Dimensionality": 0.010084033613445379, "PercentageOfNumericFeatures": 100, "MajorityClassPercentage": null, "PercentageOfSymbolicFeatures": 0, "MajorityClassSize": null, "MinorityClassPercentage": null, "MinorityClassSize": null, "NumberOfBinaryFeatures": 0, "PercentageOfBinaryFeatures": 0, "PercentageOfInstancesWithMissingValues": 0, "AutoCorrelation": 0.5643397813288478, "PercentageOfMissingValues": 0 }, "tags": [ { "uploader": "38960", "tag": "Chemistry" }, { "uploader": "38960", "tag": "Machine Learning" } ], "features": [ { "name": "target", "index": "11", "type": "numeric", "distinct": "2", "missing": "0", "target": "1", "min": "0", "max": "1", "mean": "1", "stdev": "0" }, { "name": "age", "index": "0", "type": "numeric", "distinct": "50", "missing": "0", "min": "28", "max": "77", "mean": "54", "stdev": "9" }, { "name": "sex", "index": "1", "type": "numeric", "distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "1", "stdev": "0" }, { "name": "chest_pain_type", "index": "2", "type": "numeric", "distinct": "4", "missing": "0", "min": "1", "max": "4", "mean": "3", "stdev": "1" }, { "name": "resting_bp_s", "index": "3", "type": "numeric", "distinct": "67", "missing": "0", "min": "0", "max": "200", "mean": "132", "stdev": "18" }, { "name": "cholesterol", "index": "4", "type": "numeric", "distinct": "222", "missing": "0", "min": "0", "max": "603", "mean": "210", "stdev": "101" }, { "name": "fasting_blood_sugar", "index": "5", "type": "numeric", "distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "resting_ecg", "index": "6", "type": "numeric", "distinct": "3", "missing": "0", "min": "0", "max": "2", 
"mean": "1", "stdev": "1" }, { "name": "max_heart_rate", "index": "7", "type": "numeric", "distinct": "119", "missing": "0", "min": "60", "max": "202", "mean": "140", "stdev": "26" }, { "name": "exercise_angina", "index": "8", "type": "numeric", "distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "oldpeak", "index": "9", "type": "numeric", "distinct": "53", "missing": "0", "min": "-3", "max": "6", "mean": "1", "stdev": "1" }, { "name": "ST_slope", "index": "10", "type": "numeric", "distinct": "4", "missing": "0", "min": "0", "max": "3", "mean": "2", "stdev": "1" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }