{ "data_id": "43341", "name": "Diabetes-Dataset-2019", "exact_name": "Diabetes-Dataset-2019", "version": 1, "version_label": "v1.0", "description": "Context\nThis dataset was collected by Neha Prerna Tigga and Dr. Shruti Garg of the Department of Computer Science and Engineering, BIT Mesra, Ranchi-835215 for research, non-commercial purposes only. An article is also published implementing this dataset. For more information and citation of this dataset please refer: \nTigga, N. P., Garg, S. (2020). Prediction of Type 2 Diabetes using Machine Learning Classification Methods. Procedia Computer Science, 167, 706-716. DOI: https:\/\/doi.org\/10.1016\/j.procs.2020.03.336\nContent\nThere is a total of 952 instances with 17 independent predictor variables and one binary target or dependent variable, Diabetes. \nAcknowledgements\nWe would like to thank all the participants who contributed towards the building of this dataset.\nInspiration\nTo build a machine learning algorithm to predict if a person has diabetes or not?", "format": "arff", "uploader": "Dustin Carrion", "uploader_id": 30123, "visibility": "public", "creator": null, "contributor": null, "date": "2022-03-23 12:18:45", "update_comment": null, "last_update": "2022-03-23 12:18:45", "licence": "Attribution 4.0 International (CC BY 4.0)", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/22102166\/dataset", "default_target_attribute": null, "row_id_attribute": null, "ignore_attribute": null, "runs": 0, "suggest": { "input": [ "Diabetes-Dataset-2019",
"Context This dataset was collected by Neha Prerna Tigga and Dr. Shruti Garg of the Department of Computer Science and Engineering, BIT Mesra, Ranchi-835215 for research, non-commercial purposes only. An article is also published implementing this dataset. For more information and citation of this dataset please refer: Tigga, N. P., Garg, S. (2020). Prediction of Type 2 Diabetes using Machine Learning Classification Methods. Procedia Computer Science, 167, 706-716. DOI: https:\/\/doi.org\/10.1016\/j. " ], "weight": 5 }, "qualities": { "NumberOfInstances": 952, "NumberOfFeatures": 18, "NumberOfClasses": null, "NumberOfMissingValues": 48, "NumberOfInstancesWithMissingValues": 47, "NumberOfNumericFeatures": 4, "NumberOfSymbolicFeatures": 0, "Dimensionality": 0.018907563025210083, "PercentageOfNumericFeatures": 22.22222222222222, "MajorityClassPercentage": null, "PercentageOfSymbolicFeatures": 0, "MajorityClassSize": null, "MinorityClassPercentage": null, "MinorityClassSize": null, "NumberOfBinaryFeatures": 0, "PercentageOfBinaryFeatures": 0, "PercentageOfInstancesWithMissingValues": 4.936974789915967, "AutoCorrelation": null, "PercentageOfMissingValues": 0.2801120448179272 }, "tags": [ { "uploader": "38960", "tag": "Machine Learning" } ], "features": [ { "name": "Age", "index": "0", "type": "string", "distinct": "4", "missing": "0" }, { "name": "Gender", "index": "1", "type": "string", "distinct": "2", "missing": "0" }, { "name": "Family_Diabetes", "index": "2", "type": "string", "distinct": "2", "missing": "0" }, { "name": "highBP", "index": "3", "type": "string", "distinct": "2", "missing": "0" }, { "name": "PhysicallyActive", "index": "4", "type": "string", "distinct": "4", "missing": "0" }, { "name": "BMI", "index": "5", "type": "numeric", "distinct": "26", "missing": "4", "min": "15", "max": "45", "mean": "26", "stdev": "5" }, { "name": "Smoking", "index": "6", "type": "string", "distinct": "2", "missing": "0" }, { "name": "Alcohol", "index": "7", "type": "string", "distinct": "2", "missing": "0" }, { "name": "Sleep", "index": "8", "type": "numeric", "distinct": "8", "missing": "0", "min": "4", "max": "11", "mean": "7", "stdev": "1" }, { "name": "SoundSleep", "index": "9", "type": "numeric", "distinct": "12", "missing": "0", "min": "0", "max": "11", "mean": "5", "stdev": "2" }, { "name": "RegularMedicine", "index": "10", "type": "string", "distinct": "3", "missing": "0" }, { "name": 
"JunkFood", "index": "11", "type": "string", "distinct": "4", "missing": "0" }, { "name": "Stress", "index": "12", "type": "string", "distinct": "4", "missing": "0" }, { "name": "BPLevel", "index": "13", "type": "string", "distinct": "6", "missing": "0" }, { "name": "Pregancies", "index": "14", "type": "numeric", "distinct": "5", "missing": "42", "min": "0", "max": "4", "mean": "0", "stdev": "1" }, { "name": "Pdiabetes", "index": "15", "type": "string", "distinct": "3", "missing": "1" }, { "name": "UriationFreq", "index": "16", "type": "string", "distinct": "2", "missing": "0" }, { "name": "Diabetic", "index": "17", "type": "string", "distinct": "3", "missing": "1" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }