{ "data_id": "1071", "name": "mw1", "exact_name": "mw1", "version": 1, "version_label": null, "description": "**Author**: \n**Source**: Unknown - Date unknown \n**Please cite**: \n\n%-*- text -*-\n%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%\nThis is a PROMISE data set made publicly available in order to encourage\nrepeatable, verifiable, refutable, and\/or improvable predictive models\nof software engineering.\n\nIf you publish material based on PROMISE data sets then, please\nfollow the acknowledgment guidelines posted on the PROMISE repository\nweb page http:\/\/promise.site.uottawa.ca\/SERepository .\n%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%\n1. Title\/Topic: MW1\/software defect prediction\n\n(c) 2007 : Tim Menzies : tim@menzies.us\nThis data set is distributed under the\nCreative Commons Attribution-Share Alike 3.0 License\nhttp:\/\/creativecommons.org\/licenses\/by-sa\/3.0\/\n\nYou are free:\n\n* to Share -- copy, distribute and transmit the work\n* to Remix -- to adapt the work\n\nUnder the following conditions:\n\nAttribution. You must attribute the work in the manner specified by\nthe author or licensor (but not in any way that suggests that they endorse\nyou or your use of the work).\n\nShare Alike. 
If you alter, transform, or build upon this work, you\nmay distribute the resulting work only under the same, similar or a\ncompatible license.\n\n* For any reuse or distribution, you must make clear to others the\nlicense terms of this work.\n* Any of the above conditions can be waived if you get permission from\nthe copyright holder.\n* Apart from the remix rights granted under this license, nothing in\nthis license impairs or restricts the author's moral rights.\nFor more details on this data set, see\nhttp:\/\/promisedata.org\/repository\/data\/kc2\/kc2.arff", "format": "ARFF", "uploader": "Joaquin Vanschoren", "uploader_id": 2, "visibility": "public", "creator": "Mike Chapman", "contributor": null, "date": "2014-10-06 23:57:50", "update_comment": null, "last_update": "2014-10-06 23:57:50", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/53954\/mw1.arff", "default_target_attribute": "c", "row_id_attribute": null, "ignore_attribute": null, "runs": 765, "suggest": { "input": [ "mw1", "%-*- text -*- %%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% This is a PROMISE data set made publicly available in order to encourage repeatable, verifiable, refutable, and\/or improvable predictive models of software engineering. If you publish material based on PROMISE data sets then, please follow the acknowledgment guidelines posted on the PROMISE repository web page http:\/\/promise.site.uottawa.ca\/SERepository . 
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%% " ], "weight": 5 }, "qualities": { "NumberOfInstances": 403, "NumberOfFeatures": 38, "NumberOfClasses": 2, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 37, "NumberOfSymbolicFeatures": 1, "MeanSkewnessOfNumericAtts": 2.519298523470371, "Quartile1StdDevOfNumericAtts": 1.5770367383104706, "REPTreeDepth2AUC": 0.49193548387096775, "CfsSubsetEval_kNN1NErrRate": 0.09429280397022333, "kNN1NAUC": 0.6328477280610475, "J48.001.Kappa": 0.25906735751295373, "MeanStdDevOfNumericAtts": 556.7656238748065, "Quartile2AttributeEntropy": null, "REPTreeDepth2ErrRate": 0.07692307692307693, "CfsSubsetEval_kNN1NKappa": 0.16271186440677993, "kNN1NErrRate": 0.10173697270471464, "MajorityClassPercentage": 92.3076923076923, "MinAttributeEntropy": null, "Quartile2KurtosisOfNumericAtts": 6.090989938758231, "REPTreeDepth2Kappa": 0, "ClassEntropy": 0.39124356362925566, "kNN1NKappa": 0.22641509433962306, "MajorityClassSize": 372, "MinKurtosisOfNumericAtts": -1.5270845224916383, "Quartile2MeansOfNumericAtts": 4.940446650124069, "REPTreeDepth3AUC": 0.49193548387096775, "DecisionStumpAUC": 0.6504942767950052, "MaxAttributeEntropy": null, "MinMeansOfNumericAtts": 0.0521091811414392, "Quartile2MutualInformation": null, "REPTreeDepth3ErrRate": 0.07692307692307693, "DecisionStumpErrRate": 0.07692307692307693, "MaxKurtosisOfNumericAtts": 57.15492775272825, "MinMutualInformation": null, "Quartile2SkewnessOfNumericAtts": 2.2136828211670743, "REPTreeDepth3Kappa": 0, "DecisionStumpKappa": 0, "MaxMeansOfNumericAtts": 7985.329454094293, "MaxMutualInformation": null, "MinNominalAttDistinctValues": 2, "PercentageOfBinaryFeatures": 2.631578947368421, "Quartile2StdDevOfNumericAtts": 6.4433442067949604, "RandomTreeDepth1AUC": 0.5556711758584808, "Dimensionality": 0.09429280397022333, "MaxNominalAttDistinctValues": 2, "MinSkewnessOfNumericAtts": -1.271894871135886, "PercentageOfInstancesWithMissingValues": 0, 
"Quartile3AttributeEntropy": null, "RandomTreeDepth1ErrRate": 0.13399503722084366, "EquivalentNumberOfAtts": null, "MaxSkewnessOfNumericAtts": 7.297129068550936, "MinStdDevOfNumericAtts": 0.09267538153937513, "PercentageOfMissingValues": 0, "Quartile3KurtosisOfNumericAtts": 16.67786576592366, "AutoCorrelation": 0.8557213930348259, "RandomTreeDepth1Kappa": 0.08355091383812, "J48.00001.AUC": 0.5270551508844953, "MaxStdDevOfNumericAtts": 18556.572604227917, "MinorityClassPercentage": 7.6923076923076925, "PercentageOfNumericFeatures": 97.36842105263158, "Quartile3MeansOfNumericAtts": 20.629032258064512, "CfsSubsetEval_DecisionStumpAUC": 0.6325442247658689, "RandomTreeDepth2AUC": 0.5556711758584808, "J48.00001.ErrRate": 0.08188585607940446, "MeanAttributeEntropy": null, "MinorityClassSize": 31, "PercentageOfSymbolicFeatures": 2.631578947368421, "Quartile3MutualInformation": null, "CfsSubsetEval_DecisionStumpErrRate": 0.09429280397022333, "RandomTreeDepth2ErrRate": 0.13399503722084366, "J48.00001.Kappa": 0.25906735751295373, "MeanKurtosisOfNumericAtts": 11.651332911754626, "NaiveBayesAUC": 0.7054150324181541, "Quartile1AttributeEntropy": null, "Quartile3SkewnessOfNumericAtts": 3.2373380653606167, "CfsSubsetEval_DecisionStumpKappa": 0.16271186440677993, "RandomTreeDepth2Kappa": 0.08355091383812, "J48.0001.AUC": 0.5270551508844953, "MeanMeansOfNumericAtts": 251.88784186171284, "NaiveBayesErrRate": 0.15632754342431762, "Quartile1KurtosisOfNumericAtts": 3.890388366315668, "Quartile3StdDevOfNumericAtts": 19.26994448926139, "CfsSubsetEval_NaiveBayesAUC": 0.6325442247658689, "RandomTreeDepth3AUC": 0.5556711758584808, "J48.0001.ErrRate": 0.08188585607940446, "MeanMutualInformation": null, "NaiveBayesKappa": 0.26016260162601623, "Quartile1MeansOfNumericAtts": 1.1844913151364764, "REPTreeDepth1AUC": 0.49193548387096775, "CfsSubsetEval_NaiveBayesErrRate": 0.09429280397022333, "RandomTreeDepth3ErrRate": 0.13399503722084366, "J48.0001.Kappa": 0.25906735751295373, 
"MeanNoiseToSignalRatio": null, "NumberOfBinaryFeatures": 1, "Quartile1MutualInformation": null, "REPTreeDepth1ErrRate": 0.07692307692307693, "CfsSubsetEval_NaiveBayesKappa": 0.16271186440677993, "RandomTreeDepth3Kappa": 0.08355091383812, "J48.001.AUC": 0.5270551508844953, "MeanNominalAttDistinctValues": 2, "Quartile1SkewnessOfNumericAtts": 1.7144912268055643, "REPTreeDepth1Kappa": 0, "CfsSubsetEval_kNN1NAUC": 0.6325442247658689, "StdvNominalAttDistinctValues": 0, "J48.001.ErrRate": 0.08188585607940446 }, "tags": [ { "tag": "Chemistry", "uploader": "38960" }, { "tag": "Life Science", "uploader": "38960" }, { "tag": "PROMISE", "uploader": "24659" }, { "tag": "study_1", "uploader": "2" }, { "tag": "study_123", "uploader": "3886" }, { "tag": "study_41", "uploader": "1" }, { "tag": "study_52", "uploader": "64" }, { "tag": "study_7", "uploader": "64" }, { "tag": "study_88", "uploader": "4209" }, { "tag": "study_236", "uploader": "0" }, { "tag": "study_442", "uploader": "0" }, { "tag": "study_443", "uploader": "0" }, { "tag": "study_444", "uploader": "0" }, { "tag": "study_445", "uploader": "0" } ], "features": [ { "name": "c", "index": "37", "type": "nominal", "distinct": "2", "missing": "0", "target": "1", "distr": [ [ "FALSE", "TRUE" ], [ [ "372", "0" ], [ "0", "31" ] ] ] }, { "name": "LOC_BLANK", "index": "0", "type": "numeric", "distinct": "27", "missing": "0", "min": "0", "max": "34", "mean": "5", "stdev": "5" }, { "name": "BRANCH_COUNT", "index": "1", "type": "numeric", "distinct": "33", "missing": "0", "min": "1", "max": "50", "mean": "7", "stdev": "8" }, { "name": "CALL_PAIRS", "index": "2", "type": "numeric", "distinct": "24", "missing": "0", "min": "0", "max": "25", "mean": "4", "stdev": "4" }, { "name": "LOC_CODE_AND_COMMENT", "index": "3", "type": "numeric", "distinct": "8", "missing": "0", "min": "0", "max": "16", "mean": "0", "stdev": "2" }, { "name": "LOC_COMMENTS", "index": "4", "type": "numeric", "distinct": "27", "missing": "0", "min": "0", "max": 
"42", "mean": "4", "stdev": "6" }, { "name": "CONDITION_COUNT", "index": "5", "type": "numeric", "distinct": "31", "missing": "0", "min": "0", "max": "82", "mean": "9", "stdev": "13" }, { "name": "CYCLOMATIC_COMPLEXITY", "index": "6", "type": "numeric", "distinct": "25", "missing": "0", "min": "1", "max": "28", "mean": "5", "stdev": "5" }, { "name": "CYCLOMATIC_DENSITY", "index": "7", "type": "numeric", "distinct": "53", "missing": "0", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "DECISION_COUNT", "index": "8", "type": "numeric", "distinct": "18", "missing": "0", "min": "0", "max": "36", "mean": "4", "stdev": "6" }, { "name": "DECISION_DENSITY", "index": "9", "type": "numeric", "distinct": "29", "missing": "0", "min": "0", "max": "12", "mean": "2", "stdev": "1" }, { "name": "DESIGN_COMPLEXITY", "index": "10", "type": "numeric", "distinct": "20", "missing": "0", "min": "1", "max": "26", "mean": "3", "stdev": "4" }, { "name": "DESIGN_DENSITY", "index": "11", "type": "numeric", "distinct": "39", "missing": "0", "min": "0", "max": "1", "mean": "1", "stdev": "0" }, { "name": "EDGE_COUNT", "index": "12", "type": "numeric", "distinct": "73", "missing": "0", "min": "1", "max": "134", "mean": "19", "stdev": "20" }, { "name": "ESSENTIAL_COMPLEXITY", "index": "13", "type": "numeric", "distinct": "16", "missing": "0", "min": "1", "max": "23", "mean": "2", "stdev": "3" }, { "name": "ESSENTIAL_DENSITY", "index": "14", "type": "numeric", "distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "LOC_EXECUTABLE", "index": "15", "type": "numeric", "distinct": "71", "missing": "0", "min": "2", "max": "112", "mean": "20", "stdev": "18" }, { "name": "PARAMETER_COUNT", "index": "16", "type": "numeric", "distinct": "7", "missing": "0", "min": "0", "max": "6", "mean": "1", "stdev": "1" }, { "name": "HALSTEAD_CONTENT", "index": "17", "type": "numeric", "distinct": "354", "missing": "0", "min": "6", "max": "234", "mean": "41", 
"stdev": "30" }, { "name": "HALSTEAD_DIFFICULTY", "index": "18", "type": "numeric", "distinct": "278", "missing": "0", "min": "2", "max": "48", "mean": "10", "stdev": "8" }, { "name": "HALSTEAD_EFFORT", "index": "19", "type": "numeric", "distinct": "363", "missing": "0", "min": "17", "max": "194482", "mean": "7985", "stdev": "18557" }, { "name": "HALSTEAD_ERROR_EST", "index": "20", "type": "numeric", "distinct": "63", "missing": "0", "min": "0", "max": "2", "mean": "0", "stdev": "0" }, { "name": "HALSTEAD_LENGTH", "index": "21", "type": "numeric", "distinct": "163", "missing": "0", "min": "5", "max": "889", "mean": "84", "stdev": "89" }, { "name": "HALSTEAD_LEVEL", "index": "22", "type": "numeric", "distinct": "43", "missing": "0", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "HALSTEAD_PROG_TIME", "index": "23", "type": "numeric", "distinct": "361", "missing": "0", "min": "1", "max": "10805", "mean": "444", "stdev": "1031" }, { "name": "HALSTEAD_VOLUME", "index": "24", "type": "numeric", "distinct": "332", "missing": "0", "min": "12", "max": "6182", "mean": "459", "stdev": "589" }, { "name": "MAINTENANCE_SEVERITY", "index": "25", "type": "numeric", "distinct": "42", "missing": "0", "min": "0", "max": "1", "mean": "1", "stdev": "0" }, { "name": "MODIFIED_CONDITION_COUNT", "index": "26", "type": "numeric", "distinct": "21", "missing": "0", "min": "0", "max": "23", "mean": "3", "stdev": "4" }, { "name": "MULTIPLE_CONDITION_COUNT", "index": "27", "type": "numeric", "distinct": "32", "missing": "0", "min": "0", "max": "48", "mean": "5", "stdev": "7" }, { "name": "NODE_COUNT", "index": "28", "type": "numeric", "distinct": "60", "missing": "0", "min": "2", "max": "110", "mean": "17", "stdev": "16" }, { "name": "NORMALIZED_CYLOMATIC_COMPLEXITY", "index": "29", "type": "numeric", "distinct": "45", "missing": "0", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "NUM_OPERANDS", "index": "30", "type": "numeric", "distinct": "106", "missing": 
"0", "min": "2", "max": "396", "mean": "37", "stdev": "40" }, { "name": "NUM_OPERATORS", "index": "31", "type": "numeric", "distinct": "122", "missing": "0", "min": "3", "max": "493", "mean": "47", "stdev": "50" }, { "name": "NUM_UNIQUE_OPERANDS", "index": "32", "type": "numeric", "distinct": "64", "missing": "0", "min": "2", "max": "107", "mean": "21", "stdev": "17" }, { "name": "NUM_UNIQUE_OPERATORS", "index": "33", "type": "numeric", "distinct": "31", "missing": "0", "min": "3", "max": "44", "mean": "11", "stdev": "6" }, { "name": "NUMBER_OF_LINES", "index": "34", "type": "numeric", "distinct": "92", "missing": "0", "min": "4", "max": "171", "mean": "31", "stdev": "27" }, { "name": "PERCENT_COMMENTS", "index": "35", "type": "numeric", "distinct": "151", "missing": "0", "min": "0", "max": "85", "mean": "17", "stdev": "16" }, { "name": "LOC_TOTAL", "index": "36", "type": "numeric", "distinct": "70", "missing": "0", "min": "3", "max": "112", "mean": "21", "stdev": "18" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 10, "total_downloads": 10, "reach": 10, "reuse": 15, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 15 }