{ "data_id": "57", "name": "hypothyroid", "exact_name": "hypothyroid", "version": 1, "version_label": "1", "description": "**Author**: \n**Source**: Unknown - \n**Please cite**: \n\n;\n ; Thyroid disease records supplied by the Garavan Institute and J. Ross\n ; Quinlan, New South Wales Institute, Syndney, Australia.\n ;\n ; 1987.\n ;\n \n hypothyroid, primary hypothyroid, compensated hypothyroid,\n secondary hypothyroid,\n negative.\t\t\t| classes\n \n age:\t\t\t\tcontinuous.\n sex:\t\t\t\tM, F.\n on thyroxine:\t\t\tf, t.\n query on thyroxine:\t\tf, t.\n on antithyroid medication:\tf, t.\n sick:\t\t\t\tf, t.\n pregnant:\t\t\tf, t.\n thyroid surgery:\t\tf, t.\n I131 treatment:\t\t\tf, t.\n query hypothyroid:\t\tf, t.\n query hyperthyroid:\t\tf, t.\n lithium:\t\t\tf, t.\n goitre:\t\t\t\tf, t.\n tumor:\t\t\t\tf, t.\n hypopituitary:\t\t\tf, t.\n psych:\t\t\t\tf, t.\n TSH measured:\t\t\tf, t.\n TSH:\t\t\t\tcontinuous.\n T3 measured:\t\t\tf, t.\n T3:\t\t\t\tcontinuous.\n TT4 measured:\t\t\tf, t.\n TT4:\t\t\t\tcontinuous.\n T4U measured:\t\t\tf, t.\n T4U:\t\t\t\tcontinuous.\n FTI measured:\t\t\tf, t.\n FTI:\t\t\t\tcontinuous.\n TBG measured:\t\t\tf, t.\n TBG:\t\t\t\tcontinuous.\n referral source:\t\tWEST, STMW, SVHC, SVI, SVHD, other.\n\n\n Num Instances: 3772\n Num Attributes: 30\n Num Continuous: 7 (Int 1 \/ Real 6)\n Num Discrete: 23\n Missing values: 6064 \/ 5.4%\n\n name type enum ints real missing distinct (1)\n 1 'age' Int 0% 100% 0% 1 \/ 0% 93 \/ 2% 0% \n 2 'sex' Enum 96% 0% 0% 150 \/ 4% 2 \/ 0% 0% \n 3 'on thyroxine' Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 4 'query on thyroxine' Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 5 'on antithyroid medicati Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 6 'sick' Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 7 'pregnant' Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 8 'thyroid surgery' Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 9 'I131 treatment' Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 10 'query hypothyroid' Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 11 'query hyperthyroid' Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 12 'lithium' Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 13 'goitre' Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 14 'tumor' Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 15 'hypopituitary' Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 16 'psych' Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 17 'TSH measured' Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 18 'TSH' Real 0% 11% 79% 369 \/ 10% 287 \/ 8% 2% \n 19 'T3 measured' Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 20 'T3' Real 0% 9% 71% 769 \/ 20% 69 \/ 2% 0% \n 21 'TT4 measured' Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 22 'TT4' Real 0% 94% 0% 231 \/ 6% 241 \/ 6% 1% \n 23 'T4U measured' Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 24 'T4U' Real 0% 2% 87% 387 \/ 10% 146 \/ 4% 1% \n 25 'FTI measured' Enum 100% 0% 0% 0 \/ 0% 2 \/ 0% 0% \n 26 'FTI' Real 0% 90% 0% 385 \/ 10% 234 \/ 6% 2% \n 27 'TBG measured' Enum 100% 0% 0% 0 \/ 0% 1 \/ 0% 0% \n 28 'TBG' Real 0% 0% 0% 3772 \/100% 0 \/ 0% 0% \n 29 'referral source' Enum 100% 0% 0% 0 \/ 0% 5 \/ 0% 0% \n 30 'Class' Enum 100% 0% 0% 0 \/ 0% 4 \/ 0% 0%", "format": "ARFF", "uploader": "Jan van Rijn", "uploader_id": 1, "visibility": "public", "creator": "Ross Quinlan", "contributor": null, "date": "2014-04-06 23:23:22", "update_comment": null, "last_update": "2014-04-06 23:23:22", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/57\/dataset_57_hypothyroid.arff", "default_target_attribute": "Class", "row_id_attribute": null, "ignore_attribute": null, "runs": 883, "suggest": { "input": [ "hypothyroid", "; ; Thyroid disease records supplied by the Garavan Institute and J. Ross ; Quinlan, New South Wales Institute, Syndney, Australia. ; ; 1987. ; hypothyroid, primary hypothyroid, compensated hypothyroid, secondary hypothyroid, negative. | classes age: continuous. sex: M, F. on thyroxine: f, t. query on thyroxine: f, t. on antithyroid medication: f, t. sick: f, t. pregnant: f, t. thyroid surgery: f, t. I131 treatment: f, t. query hypothyroid: f, t. query hyperthyroid: f, t. lithium: f, t. goitre: " ], "weight": 5 }, "qualities": { "NumberOfInstances": 3772, "NumberOfFeatures": 30, "NumberOfClasses": 4, "NumberOfMissingValues": 6064, "NumberOfInstancesWithMissingValues": 3772, "NumberOfNumericFeatures": 7, "NumberOfSymbolicFeatures": 23, "Quartile2AttributeEntropy": 0.25937485231702934, "REPTreeDepth2ErrRate": 0.007953340402969246, "CfsSubsetEval_kNN1NKappa": 0.8214494217145025, "kNN1NErrRate": 0.08907741251325557, "MajorityClassPercentage": 92.28525980911984, "MeanStdDevOfNumericAtts": 19.05387758896556, "Quartile2KurtosisOfNumericAtts": 8.87130380657577, "REPTreeDepth2Kappa": 0.946435215295785, "ClassEntropy": 0.46661759698663374, "kNN1NKappa": 0.3399787212879303, "MajorityClassSize": 3481, "MinAttributeEntropy": -0, "Quartile2MeansOfNumericAtts": 28.41132258295655, "REPTreeDepth3AUC": 0.9944985110919476, "DecisionStumpAUC": 0.9844898933771603, "MaxAttributeEntropy": 1.520689912507409, "MinKurtosisOfNumericAtts": 4.073471498748956, "Quartile2MutualInformation": 0.001091317700015, "REPTreeDepth3ErrRate": 0.007953340402969246, "DecisionStumpErrRate": 0.04612937433722163, "MaxKurtosisOfNumericAtts": 238.1814623780636, "MinMeansOfNumericAtts": 0.9949997045790251, "Quartile2SkewnessOfNumericAtts": 1.5381528946217138, "REPTreeDepth3Kappa": 0.946435215295785, "DecisionStumpKappa": 0.714726078305068, "MaxMeansOfNumericAtts": 110.46964865662825, "MinMutualInformation": 0, "PercentageOfBinaryFeatures": 66.66666666666666, "Quartile2StdDevOfNumericAtts": 22.3032143933016, "RandomTreeDepth1AUC": 0.9107382259055059, "Dimensionality": 0.007953340402969246, "MaxMutualInformation": 0.01195055117111, "MinNominalAttDistinctValues": 1, "PercentageOfInstancesWithMissingValues": 100, "Quartile3AttributeEntropy": 0.4759318019149815, "RandomTreeDepth1ErrRate": 0.03685047720042418, "EquivalentNumberOfAtts": 202.5849704152198, "MaxNominalAttDistinctValues": 5, "MinSkewnessOfNumericAtts": 1.232674238507278, "PercentageOfMissingValues": 5.358784022622834, "Quartile3KurtosisOfNumericAtts": 90.94248810329343, "AutoCorrelation": 0.8562715460090162, "RandomTreeDepth1Kappa": 0.7422991986969176, "J48.00001.AUC": 0.9960819087507015, "MaxSkewnessOfNumericAtts": 13.882652755041702, "MinStdDevOfNumericAtts": 0.19545727511328811, "PercentageOfNumericFeatures": 23.333333333333332, "Quartile3MeansOfNumericAtts": 108.85692077754308, "CfsSubsetEval_DecisionStumpAUC": 0.988871524706157, "RandomTreeDepth2AUC": 0.9107382259055059, "J48.00001.ErrRate": 0.005302226935312832, "MaxStdDevOfNumericAtts": 35.604247607641, "MinorityClassPercentage": 0.05302226935312832, "PercentageOfSymbolicFeatures": 76.66666666666667, "Quartile3MutualInformation": 0.002305393613935, "CfsSubsetEval_DecisionStumpErrRate": 0.02704135737009544, "RandomTreeDepth2ErrRate": 0.03685047720042418, "J48.00001.Kappa": 0.9636072438179593, "MeanAttributeEntropy": 0.33755530471128503, "MinorityClassSize": 2, "Quartile1AttributeEntropy": 0.0987401719719687, "Quartile3SkewnessOfNumericAtts": 4.937524038925616, "CfsSubsetEval_DecisionStumpKappa": 0.8214494217145025, "RandomTreeDepth2Kappa": 0.7422991986969176, "J48.0001.AUC": 0.9960819087507015, "MeanKurtosisOfNumericAtts": 51.41313506551009, "NaiveBayesAUC": 0.9342238722214744, "Quartile1KurtosisOfNumericAtts": 5.982197043232063, "Quartile3StdDevOfNumericAtts": 33.71833515687218, "CfsSubsetEval_NaiveBayesAUC": 0.988871524706157, "RandomTreeDepth3AUC": 0.9107382259055059, "J48.0001.ErrRate": 0.005302226935312832, "MeanMeansOfNumericAtts": 46.43668969641138, "NaiveBayesErrRate": 0.04665959703075292, "Quartile1MeansOfNumericAtts": 1.7588748012696314, "REPTreeDepth1AUC": 0.9944985110919476, "CfsSubsetEval_NaiveBayesErrRate": 0.02704135737009544, "RandomTreeDepth3ErrRate": 0.03685047720042418, "J48.0001.Kappa": 0.9636072438179593, "MeanMutualInformation": 0.0023033179412581817, "NaiveBayesKappa": 0.6098333890681739, "Quartile1MutualInformation": 0.00036394692046749994, "REPTreeDepth1ErrRate": 0.007953340402969246, "CfsSubsetEval_NaiveBayesKappa": 0.8214494217145025, "RandomTreeDepth3Kappa": 0.7422991986969176, "J48.001.AUC": 0.9960819087507015, "MeanNoiseToSignalRatio": 145.55176285688822, "NumberOfBinaryFeatures": 20, "Quartile1SkewnessOfNumericAtts": 1.2589465934783108, "REPTreeDepth1Kappa": 0.946435215295785, "CfsSubsetEval_kNN1NAUC": 0.988871524706157, "StdvNominalAttDistinctValues": 0.7776522892681231, "J48.001.ErrRate": 0.005302226935312832, "MeanNominalAttDistinctValues": 2.1739130434782608, "Quartile1StdDevOfNumericAtts": 0.669439962143292, "REPTreeDepth2AUC": 0.9944985110919476, "CfsSubsetEval_kNN1NErrRate": 0.02704135737009544, "kNN1NAUC": 0.6743398856933536, "J48.001.Kappa": 0.9636072438179593, "MeanSkewnessOfNumericAtts": 3.5691918824691085 }, "tags": [ { "uploader": "38960", "tag": "Health" }, { "uploader": "38960", "tag": "Medicine" }, { "uploader": "2", "tag": "study_1" }, { "uploader": "1", "tag": "study_41" }, { "uploader": "1", "tag": "uci" } ], "topics": [ { "topic": "Artificial datasets", "uploader": "8111" } ], "features": [ { "name": "Class", "index": "29", "type": "nominal", "distinct": "4", "missing": "0", "target": "1", "distr": [ [ "negative", "compensated_hypothyroid", "primary_hypothyroid", "secondary_hypothyroid" ], [ [ "3481", "0", "0", "0" ], [ "0", "194", "0", "0" ], [ "0", "0", "95", "0" ], [ "0", "0", "0", "2" ] ] ] }, { "name": "age", "index": "0", "type": "numeric", "distinct": "93", "missing": "1", "min": "1", "max": "455", "mean": "52", "stdev": "20" }, { "name": "sex", "index": "1", "type": "nominal", "distinct": "2", "missing": "150", "distr": [ [ "F", "M" ], [ [ "2265", "145", "69", "1" ], [ "1077", "42", "22", "1" ] ] ] }, { "name": "on_thyroxine", "index": "2", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3026", "194", "86", "2" ], [ "455", "0", "9", "0" ] ] ] }, { "name": "query_on_thyroxine", "index": "3", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3434", "191", "95", "2" ], [ "47", "3", "0", "0" ] ] ] }, { "name": "on_antithyroid_medication", "index": "4", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3439", "193", "95", "2" ], [ "42", "1", "0", "0" ] ] ] }, { "name": "sick", "index": "5", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3345", "183", "95", "2" ], [ "136", "11", "0", "0" ] ] ] }, { "name": "pregnant", "index": "6", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3428", "194", "95", "2" ], [ "53", "0", "0", "0" ] ] ] }, { "name": "thyroid_surgery", "index": "7", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3430", "194", "93", "2" ], [ "51", "0", "2", "0" ] ] ] }, { "name": "I131_treatment", "index": "8", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3427", "191", "93", "2" ], [ "54", "3", "2", "0" ] ] ] }, { "name": "query_hypothyroid", "index": "9", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3286", "167", "84", "1" ], [ "195", "27", "11", "1" ] ] ] }, { "name": "query_hyperthyroid", "index": "10", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3259", "182", "92", "2" ], [ "222", "12", "3", "0" ] ] ] }, { "name": "lithium", "index": "11", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3464", "193", "95", "2" ], [ "17", "1", "0", "0" ] ] ] }, { "name": "goitre", "index": "12", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3447", "194", "95", "2" ], [ "34", "0", "0", "0" ] ] ] }, { "name": "tumor", "index": "13", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3393", "188", "93", "2" ], [ "88", "6", "2", "0" ] ] ] }, { "name": "hypopituitary", "index": "14", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3480", "194", "95", "2" ], [ "1", "0", "0", "0" ] ] ] }, { "name": "psych", "index": "15", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3305", "186", "95", "2" ], [ "176", "8", "0", "0" ] ] ] }, { "name": "TSH_measured", "index": "16", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "t", "f" ], [ [ "3112", "194", "95", "2" ], [ "369", "0", "0", "0" ] ] ] }, { "name": "TSH", "index": "17", "type": "numeric", "distinct": "287", "missing": "369", "min": "0", "max": "530", "mean": "5", "stdev": "25" }, { "name": "T3_measured", "index": "18", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "t", "f" ], [ [ "2758", "157", "86", "2" ], [ "723", "37", "9", "0" ] ] ] }, { "name": "T3", "index": "19", "type": "numeric", "distinct": "69", "missing": "769", "min": "0", "max": "11", "mean": "2", "stdev": "1" }, { "name": "TT4_measured", "index": "20", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "t", "f" ], [ [ "3255", "192", "92", "2" ], [ "226", "2", "3", "0" ] ] ] }, { "name": "TT4", "index": "21", "type": "numeric", "distinct": "241", "missing": "231", "min": "2", "max": "430", "mean": "108", "stdev": "36" }, { "name": "T4U_measured", "index": "22", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "t", "f" ], [ [ "3119", "177", "88", "1" ], [ "362", "17", "7", "1" ] ] ] }, { "name": "T4U", "index": "23", "type": "numeric", "distinct": "146", "missing": "387", "min": "0", "max": "2", "mean": "1", "stdev": "0" }, { "name": "FTI_measured", "index": "24", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "t", "f" ], [ [ "3121", "177", "88", "1" ], [ "360", "17", "7", "1" ] ] ] }, { "name": "FTI", "index": "25", "type": "numeric", "distinct": "234", "missing": "385", "min": "2", "max": "395", "mean": "110", "stdev": "33" }, { "name": "TBG_measured", "index": "26", "type": "nominal", "distinct": "1", "missing": "0", "distr": [ [ "f" ], [ [ "3481", "194", "95", "2" ] ] ] }, { "name": "TBG", "index": "27", "type": "numeric", "distinct": "0", "missing": "3772", "min": "2147483647", "max": "0", "mean": "0", "stdev": "0" }, { "name": "referral_source", "index": "28", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "SVHC", "other", "SVI", "STMW", "SVHD" ], [ [ "375", "10", "1", "0" ], [ "2028", "119", "52", "2" ], [ "937", "58", "39", "0" ], [ "105", "4", "3", "0" ], [ "36", "3", "0", "0" ] ] ] } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }