{ "data_id": "1000", "name": "hypothyroid", "exact_name": "hypothyroid", "version": 2, "version_label": null, "description": "**Author**: \n**Source**: Unknown - Date unknown \n**Please cite**: \n\nBinarized version of the original data set (see version 1). The multi-class target feature is converted to a two-class nominal target feature by re-labeling the majority class as positive ('P') and all others as negative ('N'). Originally converted by Quan Sun.", "format": "ARFF", "uploader": "Joaquin Vanschoren", "uploader_id": 2, "visibility": "public", "creator": null, "contributor": null, "date": "2014-10-04 22:44:48", "update_comment": null, "last_update": "2014-10-04 22:44:48", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/53534\/hypothyroid.arff", "default_target_attribute": "binaryClass", "row_id_attribute": null, "ignore_attribute": null, "runs": 737, "suggest": { "input": [ "hypothyroid", "Binarized version of the original data set (see version 1). The multi-class target feature is converted to a two-class nominal target feature by re-labeling the majority class as positive ('P') and all others as negative ('N'). Originally converted by Quan Sun. " ], "weight": 5 }, "qualities": { "NumberOfInstances": 3772, "NumberOfFeatures": 30, "NumberOfClasses": 2, "NumberOfMissingValues": 6064, "NumberOfInstancesWithMissingValues": 3772, "NumberOfNumericFeatures": 7, "NumberOfSymbolicFeatures": 23, "REPTreeDepth3Kappa": 0.9548894210789105, "DecisionStumpKappa": 0.8684491204277603, "MaxMeansOfNumericAtts": 110.46964865662825, "MinMutualInformation": 0, "Quartile2SkewnessOfNumericAtts": 1.5381528946217138, "RandomTreeDepth1AUC": 0.9459928444184418, "Dimensionality": 0.007953340402969246, "MaxMutualInformation": 0.01195055117111, "MinNominalAttDistinctValues": 1, "PercentageOfBinaryFeatures": 70, "Quartile2StdDevOfNumericAtts": 22.3032143933016, "RandomTreeDepth1ErrRate": 0.015641569459172854, "EquivalentNumberOfAtts": 234.83251874777525, "MaxNominalAttDistinctValues": 5, "MinSkewnessOfNumericAtts": 1.232674238507278, "PercentageOfInstancesWithMissingValues": 100, "Quartile3AttributeEntropy": 0.4759318019149815, "RandomTreeDepth1Kappa": 0.8892791613100949, "J48.00001.AUC": 0.9881714723705874, "MaxSkewnessOfNumericAtts": 13.882652755041702, "MinStdDevOfNumericAtts": 0.19545727511328811, "PercentageOfMissingValues": 5.358784022622834, "Quartile3KurtosisOfNumericAtts": 90.94248810329343, "AutoCorrelation": 0.8594537258021745, "RandomTreeDepth2AUC": 0.9459928444184418, "J48.00001.ErrRate": 0.00503711558854719, "MaxStdDevOfNumericAtts": 35.604247607641, "MinorityClassPercentage": 7.714740190880169, "PercentageOfNumericFeatures": 23.333333333333332, "Quartile3MeansOfNumericAtts": 108.85692077754308, "CfsSubsetEval_DecisionStumpAUC": 0.9777747832859974, "RandomTreeDepth2ErrRate": 0.015641569459172854, "J48.00001.Kappa": 0.9644569553633956, "MeanAttributeEntropy": 0.33755530471128503, "MinorityClassSize": 291, "PercentageOfSymbolicFeatures": 76.66666666666667, "Quartile3MutualInformation": 0.0021093508107675003, "CfsSubsetEval_DecisionStumpErrRate": 0.02704135737009544, "RandomTreeDepth2Kappa": 0.8892791613100949, "J48.0001.AUC": 0.9881714723705874, "MeanKurtosisOfNumericAtts": 51.41313506551009, "NaiveBayesAUC": 0.9128114452777665, "Quartile1AttributeEntropy": 0.0987401719719687, "Quartile3SkewnessOfNumericAtts": 4.937524038925616, "CfsSubsetEval_DecisionStumpKappa": 0.8147581442689444, "RandomTreeDepth3AUC": 0.9459928444184418, "J48.0001.ErrRate": 0.00503711558854719, "MeanMeansOfNumericAtts": 46.43668969641138, "NaiveBayesErrRate": 0.050106044538706256, "Quartile1KurtosisOfNumericAtts": 5.982197043232063, "Quartile3StdDevOfNumericAtts": 33.71833515687218, "CfsSubsetEval_NaiveBayesAUC": 0.9777747832859974, "RandomTreeDepth3ErrRate": 0.015641569459172854, "J48.0001.Kappa": 0.9644569553633956, "MeanMutualInformation": 0.001669475980666818, "NaiveBayesKappa": 0.5476908318487048, "Quartile1MeansOfNumericAtts": 1.7588748012696314, "REPTreeDepth1AUC": 0.9933996136118408, "CfsSubsetEval_NaiveBayesErrRate": 0.02704135737009544, "RandomTreeDepth3Kappa": 0.8892791613100949, "J48.001.AUC": 0.9881714723705874, "MeanNoiseToSignalRatio": 201.1923697137946, "NumberOfBinaryFeatures": 21, "Quartile1MutualInformation": 2.9259651115000003e-5, "REPTreeDepth1ErrRate": 0.006362672322375398, "CfsSubsetEval_NaiveBayesKappa": 0.8147581442689444, "CfsSubsetEval_kNN1NAUC": 0.9777747832859974, "StdvNominalAttDistinctValues": 0.668311541278118, "J48.001.ErrRate": 0.00503711558854719, "MeanNominalAttDistinctValues": 2.0869565217391304, "Quartile1SkewnessOfNumericAtts": 1.2589465934783108, "REPTreeDepth1Kappa": 0.9548894210789105, "CfsSubsetEval_kNN1NErrRate": 0.02704135737009544, "kNN1NAUC": 0.6649849798266683, "J48.001.Kappa": 0.9644569553633956, "MeanSkewnessOfNumericAtts": 3.5691918824691085, "Quartile1StdDevOfNumericAtts": 0.669439962143292, "REPTreeDepth2AUC": 0.9933996136118408, "CfsSubsetEval_kNN1NKappa": 0.8147581442689444, "kNN1NErrRate": 0.08510074231177095, "MajorityClassPercentage": 92.28525980911984, "MeanStdDevOfNumericAtts": 19.05387758896556, "Quartile2AttributeEntropy": 0.25937485231702934, "REPTreeDepth2ErrRate": 0.006362672322375398, "ClassEntropy": 0.392047249528901, "kNN1NKappa": 0.34792920567492025, "MajorityClassSize": 3481, "MinAttributeEntropy": -0, "Quartile2KurtosisOfNumericAtts": 8.87130380657577, "REPTreeDepth2Kappa": 0.9548894210789105, "REPTreeDepth3AUC": 0.9933996136118408, "DecisionStumpAUC": 0.9839526501745854, "MaxAttributeEntropy": 1.520689912507409, "MinKurtosisOfNumericAtts": 4.073471498748956, "Quartile2MeansOfNumericAtts": 28.41132258295655, "REPTreeDepth3ErrRate": 0.006362672322375398, "DecisionStumpErrRate": 0.020943796394485684, "MaxKurtosisOfNumericAtts": 238.1814623780636, "MinMeansOfNumericAtts": 0.9949997045790251, "Quartile2MutualInformation": 0.000364392640035 }, "tags": [ { "uploader": "38960", "tag": "Chemistry" }, { "uploader": "38960", "tag": "Life Science" }, { "uploader": "1", "tag": "mythbusting_1" }, { "uploader": "2", "tag": "study_1" }, { "uploader": "5824", "tag": "study_144" }, { "uploader": "939", "tag": "study_15" }, { "uploader": "939", "tag": "study_20" }, { "uploader": "1", "tag": "study_41" } ], "features": [ { "name": "binaryClass", "index": "29", "type": "nominal", "distinct": "2", "missing": "0", "target": "1", "distr": [ [ "P", "N" ], [ [ "3481", "0" ], [ "0", "291" ] ] ] }, { "name": "age", "index": "0", "type": "numeric", "distinct": "93", "missing": "1", "min": "1", "max": "455", "mean": "52", "stdev": "20" }, { "name": "sex", "index": "1", "type": "nominal", "distinct": "2", "missing": "150", "distr": [ [ "F", "M" ], [ [ "2265", "215" ], [ "1077", "65" ] ] ] }, { "name": "on thyroxine", "index": "2", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3026", "282" ], [ "455", "9" ] ] ] }, { "name": "query on thyroxine", "index": "3", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3434", "288" ], [ "47", "3" ] ] ] }, { "name": "on antithyroid medication", "index": "4", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3439", "290" ], [ "42", "1" ] ] ] }, { "name": "sick", "index": "5", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3345", "280" ], [ "136", "11" ] ] ] }, { "name": "pregnant", "index": "6", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3428", "291" ], [ "53", "0" ] ] ] }, { "name": "thyroid surgery", "index": "7", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3430", "289" ], [ "51", "2" ] ] ] }, { "name": "I131 treatment", "index": "8", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3427", "286" ], [ "54", "5" ] ] ] }, { "name": "query hypothyroid", "index": "9", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3286", "252" ], [ "195", "39" ] ] ] }, { "name": "query hyperthyroid", "index": "10", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3259", "276" ], [ "222", "15" ] ] ] }, { "name": "lithium", "index": "11", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3464", "290" ], [ "17", "1" ] ] ] }, { "name": "goitre", "index": "12", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3447", "291" ], [ "34", "0" ] ] ] }, { "name": "tumor", "index": "13", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3393", "283" ], [ "88", "8" ] ] ] }, { "name": "hypopituitary", "index": "14", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3480", "291" ], [ "1", "0" ] ] ] }, { "name": "psych", "index": "15", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "f", "t" ], [ [ "3305", "283" ], [ "176", "8" ] ] ] }, { "name": "TSH measured", "index": "16", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "t", "f" ], [ [ "3112", "291" ], [ "369", "0" ] ] ] }, { "name": "TSH", "index": "17", "type": "numeric", "distinct": "287", "missing": "369", "min": "0", "max": "530", "mean": "5", "stdev": "25" }, { "name": "T3 measured", "index": "18", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "t", "f" ], [ [ "2758", "245" ], [ "723", "46" ] ] ] }, { "name": "T3", "index": "19", "type": "numeric", "distinct": "69", "missing": "769", "min": "0", "max": "11", "mean": "2", "stdev": "1" }, { "name": "TT4 measured", "index": "20", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "t", "f" ], [ [ "3255", "286" ], [ "226", "5" ] ] ] }, { "name": "TT4", "index": "21", "type": "numeric", "distinct": "241", "missing": "231", "min": "2", "max": "430", "mean": "108", "stdev": "36" }, { "name": "T4U measured", "index": "22", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "t", "f" ], [ [ "3119", "266" ], [ "362", "25" ] ] ] }, { "name": "T4U", "index": "23", "type": "numeric", "distinct": "146", "missing": "387", "min": "0", "max": "2", "mean": "1", "stdev": "0" }, { "name": "FTI measured", "index": "24", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "t", "f" ], [ [ "3121", "266" ], [ "360", "25" ] ] ] }, { "name": "FTI", "index": "25", "type": "numeric", "distinct": "234", "missing": "385", "min": "2", "max": "395", "mean": "110", "stdev": "33" }, { "name": "TBG measured", "index": "26", "type": "nominal", "distinct": "1", "missing": "0", "distr": [ [ "f" ], [ [ "3481", "291" ] ] ] }, { "name": "TBG", "index": "27", "type": "numeric", "distinct": "0", "missing": "3772", "min": "2147483647", "max": "0", "mean": "0", "stdev": "0" }, { "name": "referral source", "index": "28", "type": "nominal", "distinct": "5", "missing": "0", "distr": [ [ "SVHC", "other", "SVI", "STMW", "SVHD" ], [ [ "375", "11" ], [ "2028", "173" ], [ "937", "97" ], [ "105", "7" ], [ "36", "3" ] ] ] } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }