{ "data_id": "983", "name": "cmc", "exact_name": "cmc", "version": 2, "version_label": null, "description": "**Author**: \n**Source**: Unknown - Date unknown \n**Please cite**: \n\nBinarized version of the original data set (see version 1). The multi-class target feature is converted to a two-class nominal target feature by re-labeling the majority class as positive ('P') and all others as negative ('N'). Originally converted by Quan Sun.", "format": "ARFF", "uploader": "Joaquin Vanschoren", "uploader_id": 2, "visibility": "public", "creator": null, "contributor": null, "date": "2014-10-04 22:44:18", "update_comment": null, "last_update": "2014-10-04 22:44:18", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/53517\/cmc.arff", "kaggle_url": null, "default_target_attribute": "binaryClass", "row_id_attribute": null, "ignore_attribute": null, "runs": 736, "suggest": { "input": [ "cmc", "Binarized version of the original data set (see version 1). The multi-class target feature is converted to a two-class nominal target feature by re-labeling the majority class as positive ('P') and all others as negative ('N'). Originally converted by Quan Sun. " ], "weight": 5 }, "qualities": { "NumberOfInstances": 1473, "NumberOfFeatures": 10, "NumberOfClasses": 2, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 2, "NumberOfSymbolicFeatures": 8, "J48.001.Kappa": 0.3500256750186951, "MeanSkewnessOfNumericAtts": 0.6777315757939906, "Quartile1StdDevOfNumericAtts": 2.3585488626874125, "REPTreeDepth2AUC": 0.701547065604774, "CfsSubsetEval_kNN1NErrRate": 0.30414120841819414, "kNN1NAUC": 0.6211092609196874, "MajorityClassPercentage": 57.298031228784794, "MeanStdDevOfNumericAtts": 5.2928968090790125, "Quartile2AttributeEntropy": 1.4479885111323352, "REPTreeDepth2ErrRate": 0.32382892057026474, "CfsSubsetEval_kNN1NKappa": 0.3475612046958699, "kNN1NErrRate": 0.38357094365241007, "MajorityClassSize": 844, "MinAttributeEntropy": 0.380671663040156, "Quartile2KurtosisOfNumericAtts": 0.2928560302339025, "REPTreeDepth2Kappa": 0.30694796938667807, "ClassEntropy": 0.9845770107616216, "kNN1NKappa": 0.2112072274608633, "MaxAttributeEntropy": 1.8667550694041894, "MinKurtosisOfNumericAtts": -0.9438944908638565, "Quartile2MeansOfNumericAtts": 17.899864222674818, "REPTreeDepth3AUC": 0.701547065604774, "DecisionStumpAUC": 0.5715816876257356, "MaxKurtosisOfNumericAtts": 1.5296065513316615, "MinMeansOfNumericAtts": 3.2613713509843865, "Quartile2MutualInformation": 0.01486312313271, "REPTreeDepth3ErrRate": 0.32382892057026474, "DecisionStumpErrRate": 0.36388323150033947, "MaxMeansOfNumericAtts": 32.53835709436525, "MinMutualInformation": 0.00111384150806, "Quartile2SkewnessOfNumericAtts": 0.6777315757939906, "REPTreeDepth3Kappa": 0.30694796938667807, "DecisionStumpKappa": 0.16661248168618037, "MaxMutualInformation": 0.04390904211006, "MinNominalAttDistinctValues": 2, "PercentageOfBinaryFeatures": 40, "Quartile2StdDevOfNumericAtts": 5.2928968090790125, "RandomTreeDepth1AUC": 0.6246797745612912, "Dimensionality": 0.006788866259334691, "MaxNominalAttDistinctValues": 4, "MinSkewnessOfNumericAtts": 0.25644920548189276, "PercentageOfInstancesWithMissingValues": 0, "Quartile3AttributeEntropy": 1.757839343635201, "RandomTreeDepth1ErrRate": 0.37338764426340804, "EquivalentNumberOfAtts": 65.02645986797907, "MaxSkewnessOfNumericAtts": 1.0990139461060884, "MinStdDevOfNumericAtts": 2.3585488626874125, "PercentageOfMissingValues": 0, "Quartile3KurtosisOfNumericAtts": 1.5296065513316615, "AutoCorrelation": 0.9979619565217391, "RandomTreeDepth1Kappa": 0.23758624973179307, "J48.00001.AUC": 0.6956982421507094, "MaxStdDevOfNumericAtts": 8.227244755470613, "MinorityClassPercentage": 42.701968771215206, "PercentageOfNumericFeatures": 20, "Quartile3MeansOfNumericAtts": 32.53835709436525, "CfsSubsetEval_DecisionStumpAUC": 0.6989438211559762, "RandomTreeDepth2AUC": 0.6246797745612912, "J48.00001.ErrRate": 0.30685675492192804, "MeanAttributeEntropy": 1.2208122969788784, "MinorityClassSize": 629, "PercentageOfSymbolicFeatures": 80, "Quartile3MutualInformation": 0.01847383155984, "CfsSubsetEval_DecisionStumpErrRate": 0.30414120841819414, "RandomTreeDepth2ErrRate": 0.37338764426340804, "J48.00001.Kappa": 0.3500256750186951, "MeanKurtosisOfNumericAtts": 0.2928560302339025, "NaiveBayesAUC": 0.6834354915272116, "Quartile1AttributeEntropy": 0.6082239803272842, "Quartile3SkewnessOfNumericAtts": 1.0990139461060884, "CfsSubsetEval_DecisionStumpKappa": 0.3475612046958699, "RandomTreeDepth2Kappa": 0.23758624973179307, "J48.0001.AUC": 0.6956982421507094, "MeanMeansOfNumericAtts": 17.89986422267482, "NaiveBayesErrRate": 0.3394433129667346, "Quartile1KurtosisOfNumericAtts": -0.9438944908638565, "Quartile3StdDevOfNumericAtts": 8.227244755470613, "CfsSubsetEval_NaiveBayesAUC": 0.6989438211559762, "RandomTreeDepth3AUC": 0.6246797745612912, "J48.0001.ErrRate": 0.30685675492192804, "MeanMutualInformation": 0.01514117503491, "NaiveBayesKappa": 0.28639391056137, "Quartile1MeansOfNumericAtts": 3.2613713509843865, "REPTreeDepth1AUC": 0.701547065604774, "CfsSubsetEval_NaiveBayesErrRate": 0.30414120841819414, "RandomTreeDepth3ErrRate": 0.37338764426340804, "J48.0001.Kappa": 0.3500256750186951, "MeanNoiseToSignalRatio": 79.62863642776288, "NumberOfBinaryFeatures": 4, "Quartile1MutualInformation": 0.00391187819022, "REPTreeDepth1ErrRate": 0.32382892057026474, "CfsSubsetEval_NaiveBayesKappa": 0.3475612046958699, "RandomTreeDepth3Kappa": 0.23758624973179307, "J48.001.AUC": 0.6956982421507094, "MeanNominalAttDistinctValues": 3, "Quartile1SkewnessOfNumericAtts": 0.25644920548189276, "REPTreeDepth1Kappa": 0.30694796938667807, "CfsSubsetEval_kNN1NAUC": 0.6989438211559762, "StdvNominalAttDistinctValues": 1.0690449676496976, "J48.001.ErrRate": 0.30685675492192804 }, "tags": [ { "uploader": "38960", "tag": "Education" }, { "uploader": "1", "tag": "mythbusting_1" }, { "uploader": "38960", "tag": "Sociology" }, { "uploader": "38960", "tag": "Statistics" }, { "uploader": "2", "tag": "study_1" }, { "uploader": "5824", "tag": "study_144" }, { "uploader": "939", "tag": "study_15" }, { "uploader": "939", "tag": "study_20" }, { "uploader": "1", "tag": "study_41" }, { "uploader": "64", "tag": "study_7" } ], "features": [ { "name": "binaryClass", "index": "9", "type": "nominal", "distinct": "2", "missing": "0", "target": "1", "distr": [ [ "P", "N" ], [ [ "629", "0" ], [ "0", "844" ] ] ] }, { "name": "Wifes_age", "index": "0", "type": "numeric", "distinct": "34", "missing": "0", "min": "16", "max": "49", "mean": "33", "stdev": "8" }, { "name": "Wifes_education", "index": "1", "type": "nominal", "distinct": "4", "missing": "0", "distr": [ [ "1", "2", "3", "4" ], [ [ "103", "49" ], [ "176", "158" ], [ "175", "235" ], [ "175", "402" ] ] ] }, { "name": "Husbands_education", "index": "2", "type": "nominal", "distinct": "4", "missing": "0", "distr": [ [ "1", "2", "3", "4" ], [ [ "31", "13" ], [ "99", "79" ], [ "161", "191" ], [ "338", "561" ] ] ] }, { "name": "Number_of_children_ever_born", "index": "3", "type": "numeric", "distinct": "15", "missing": "0", "min": "0", "max": "16", "mean": "3", "stdev": "2" }, { "name": "Wifes_religion", "index": "4", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "0", "1" ], [ [ "75", "145" ], [ "554", "699" ] ] ] }, { "name": "Wifes_now_working?", "index": "5", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "0", "1" ], [ [ "170", "199" ], [ "459", "645" ] ] ] }, { "name": "Husbands_occupation", "index": "6", "type": "nominal", "distinct": "4", "missing": "0", "distr": [ [ "1", "2", "3", "4" ], [ [ "158", "278" ], [ "200", "225" ], [ "258", "327" ], [ "13", "14" ] ] ] }, { "name": "Standard-of-living_index", "index": "7", "type": "nominal", "distinct": "4", "missing": "0", "distr": [ [ "1", "2", "3", "4" ], [ [ "80", "49" ], [ "117", "112" ], [ "184", "247" ], [ "248", "436" ] ] ] }, { "name": "Media_exposure", "index": "8", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "0", "1" ], [ [ "555", "809" ], [ "74", "35" ] ] ] } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }