{ "data_id": "1405", "name": "BNG(lymph,5000,1)", "exact_name": "BNG(lymph,5000,1)", "version": 1, "version_label": null, "description": "", "format": "ARFF", "uploader": "Jan van Rijn", "uploader_id": 1, "visibility": "public", "creator": "\"Geoffrey Holmes\",\"Bernhard Pfahringer\",\"Jan van Rijn\",\"Joaquin Vanschoren\"", "contributor": null, "date": "2015-02-23 03:35:55", "update_comment": null, "last_update": "2015-02-23 03:35:55", "licence": "public domain", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/584478\/BNG_lymph_5000_1.arff", "kaggle_url": null, "default_target_attribute": "class", "row_id_attribute": null, "ignore_attribute": null, "runs": 27, "suggest": { "input": [ "BNG(lymph,5000,1)", " " ], "weight": 5 }, "qualities": { "NumberOfInstances": 1000000, "NumberOfFeatures": 19, "NumberOfClasses": 4, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 3, "NumberOfSymbolicFeatures": 16, "Quartile2SkewnessOfNumericAtts": 0.5955997960134153, "REPTreeDepth3Kappa": 0.7597084657321161, "DecisionStumpKappa": 0.5805183947403377, "MaxMeansOfNumericAtts": 2.9927388224675746, "MinMutualInformation": 0.00330176008986, "Quartile2StdDevOfNumericAtts": 0.9820142362342611, "RandomTreeDepth1AUC": 0.8630698285202355, "Dimensionality": 1.9e-5, "MaxMutualInformation": 0.3028987688806, "MinNominalAttDistinctValues": 2, "PercentageOfBinaryFeatures": 47.368421052631575, "Quartile3AttributeEntropy": 1.8540533722424688, "RandomTreeDepth1ErrRate": 0.162755, "EquivalentNumberOfAtts": 28.828503996046162, "MaxNominalAttDistinctValues": 8, "MinSkewnessOfNumericAtts": 0.22810541141308213, "PercentageOfInstancesWithMissingValues": 0, "Quartile3KurtosisOfNumericAtts": -0.4897141358020085, "AutoCorrelation": 0.46374446374446376, "RandomTreeDepth1Kappa": 0.6951414455776074, "J48.00001.AUC": 0.9380219648309862, "MaxSkewnessOfNumericAtts": 0.8450797335561597, "MinStdDevOfNumericAtts": 0.8732285683438978, "PercentageOfMissingValues": 0, "Quartile3MeansOfNumericAtts": 2.9927388224675746, "CfsSubsetEval_DecisionStumpAUC": 0.9110970620831691, "RandomTreeDepth2AUC": 0.8630698285202355, "J48.00001.ErrRate": 0.113379, "MaxStdDevOfNumericAtts": 2.046572678417054, "MinorityClassPercentage": 1.6507999999999998, "PercentageOfNumericFeatures": 15.789473684210526, "Quartile3MutualInformation": 0.03013921135778, "CfsSubsetEval_DecisionStumpErrRate": 0.16232, "RandomTreeDepth2ErrRate": 0.162755, "J48.00001.Kappa": 0.7844787796475893, "MeanAttributeEntropy": 1.3385119683695814, "MinorityClassSize": 16508, "PercentageOfSymbolicFeatures": 84.21052631578947, "Quartile3SkewnessOfNumericAtts": 0.8450797335561597, "CfsSubsetEval_DecisionStumpKappa": 0.6876773539289716, "RandomTreeDepth2Kappa": 0.6951414455776074, "J48.0001.AUC": 0.9380219648309862, "MeanKurtosisOfNumericAtts": -0.9560567075702596, "NaiveBayesAUC": 0.9120119885963771, "Quartile1AttributeEntropy": 0.9449056585696294, "Quartile1KurtosisOfNumericAtts": -1.4258673847620875, "Quartile3StdDevOfNumericAtts": 2.046572678417054, "CfsSubsetEval_NaiveBayesAUC": 0.9110970620831691, "RandomTreeDepth3AUC": 0.8630698285202355, "J48.0001.ErrRate": 0.113379, "MeanMeansOfNumericAtts": 2.36308127415568, "NaiveBayesErrRate": 0.184338, "Quartile1MeansOfNumericAtts": 1.7107809999992971, "REPTreeDepth1AUC": 0.9427567563509246, "CfsSubsetEval_NaiveBayesErrRate": 0.16232, "RandomTreeDepth3ErrRate": 0.162755, "J48.0001.Kappa": 0.7844787796475893, "MeanMutualInformation": 0.04357512507999533, "NaiveBayesKappa": 0.6455279116061291, "Quartile1MutualInformation": 0.0128202455442, "REPTreeDepth1ErrRate": 0.125891, "CfsSubsetEval_NaiveBayesKappa": 0.6876773539289716, "RandomTreeDepth3Kappa": 0.6951414455776074, "J48.001.AUC": 0.9380219648309862, "MeanNoiseToSignalRatio": 29.71734082030373, "NumberOfBinaryFeatures": 9, "Quartile1SkewnessOfNumericAtts": 0.22810541141308213, "REPTreeDepth1Kappa": 0.7597084657321161, "CfsSubsetEval_kNN1NAUC": 0.9110970620831691, "StdvNominalAttDistinctValues": 1.591644851508443, "J48.001.ErrRate": 0.113379, "MeanNominalAttDistinctValues": 3, "Quartile1StdDevOfNumericAtts": 0.8732285683438978, "REPTreeDepth2AUC": 0.9427567563509246, "CfsSubsetEval_kNN1NErrRate": 0.16232, "kNN1NAUC": 0.8834376368633466, "J48.001.Kappa": 0.7844787796475893, "MeanSkewnessOfNumericAtts": 0.5562616469942191, "Quartile2AttributeEntropy": 0.9961305413038389, "REPTreeDepth2ErrRate": 0.125891, "CfsSubsetEval_kNN1NKappa": 0.6876773539289716, "kNN1NErrRate": 0.149106, "MajorityClassPercentage": 54.34949999999999, "MeanStdDevOfNumericAtts": 1.3006051609984044, "Quartile2KurtosisOfNumericAtts": -0.9525886021466827, "REPTreeDepth2Kappa": 0.7597084657321161, "ClassEntropy": 1.2562056674968567, "kNN1NKappa": 0.7183270619859807, "MajorityClassSize": 543495, "MinAttributeEntropy": 0.7016785142780103, "Quartile2MeansOfNumericAtts": 2.385724000000169, "REPTreeDepth3AUC": 0.9427567563509246, "DecisionStumpAUC": 0.794005536785028, "MaxAttributeEntropy": 2.943490702280273, "MinKurtosisOfNumericAtts": -1.4258673847620875, "Quartile2MutualInformation": 0.01509962724161, "REPTreeDepth3ErrRate": 0.125891, "DecisionStumpErrRate": 0.216907, "MaxKurtosisOfNumericAtts": -0.4897141358020085, "MinMeansOfNumericAtts": 1.7107809999992971 }, "tags": [ { "uploader": "2", "tag": "artificial" }, { "uploader": "38960", "tag": "Biology" }, { "uploader": "1", "tag": "BNG" }, { "uploader": "38960", "tag": "Health" }, { "uploader": "38960", "tag": "Lymphatic System" }, { "uploader": "38960", "tag": "Medical" } ], "features": [ { "name": "class", "index": "18", "type": "nominal", "distinct": "4", "missing": "0", "target": "1", "distr": [ [ "normal", "metastases", "malign_lymph", "fibrosis" ], [ [ "16508", "0", "0", "0" ], [ "0", "543495", "0", "0" ], [ "0", "0", "409672", "0" ], [ "0", "0", "0", "30325" ] ] ] }, { "name": "lymphatics", "index": "0", "type": "nominal", "distinct": "4", "missing": "0", "distr": [ [ "normal", "arched", "deformed", "displaced" ], [ [ "2997", "28104", "57712", "10622" ], [ "3711", "226841", "102068", "7297" ], [ "7394", "161409", "185506", "7806" ], [ "2406", "127141", "64386", "4600" ] ] ] }, { "name": "block_of_affere", "index": "1", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "no", "yes" ], [ [ "9251", "272111", "237772", "19228" ], [ "7257", "271384", "171900", "11097" ] ] ] }, { "name": "bl_of_lymph_c", "index": "2", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "no", "yes" ], [ [ "11262", "479499", "299501", "19639" ], [ "5246", "63996", "110171", "10686" ] ] ] }, { "name": "bl_of_lymph_s", "index": "3", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "no", "yes" ], [ [ "10182", "292648", "367501", "21910" ], [ "6326", "250847", "42171", "8415" ] ] ] }, { "name": "by_pass", "index": "4", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "no", "yes" ], [ [ "5962", "449628", "76207", "15527" ], [ "10546", "93867", "333465", "14798" ] ] ] }, { "name": "extravasates", "index": "5", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "no", "yes" ], [ [ "7663", "326214", "191323", "11404" ], [ "8845", "217281", "218349", "18921" ] ] ] }, { "name": "regeneration_of", "index": "6", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "no", "yes" ], [ [ "15003", "367067", "243460", "11765" ], [ "1505", "176428", "166212", "18560" ] ] ] }, { "name": "early_uptake_in", "index": "7", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "no", "yes" ], [ [ "7196", "314655", "191873", "8376" ], [ "9312", "228840", "217799", "21949" ] ] ] }, { "name": "lym_nodes_dimin", "index": "8", "type": "numeric", "distinct": "3", "missing": "0", "min": "1", "max": "3", "mean": "2", "stdev": "1" }, { "name": "lym_nodes_enlar", "index": "9", "type": "numeric", "distinct": "4", "missing": "0", "min": "1", "max": "4", "mean": "2", "stdev": "1" }, { "name": "changes_in_lym", "index": "10", "type": "nominal", "distinct": "3", "missing": "0", "distr": [ [ "bean", "oval", "round" ], [ [ "5009", "74799", "47968", "9222" ], [ "4761", "254250", "228810", "12246" ], [ "6738", "214446", "132894", "8857" ] ] ] }, { "name": "defect_in_node", "index": "11", "type": "nominal", "distinct": "4", "missing": "0", "distr": [ [ "no", "lacunar", "lac_margin", "lac_central" ], [ [ "4610", "64016", "61568", "6102" ], [ "4834", "178261", "89114", "9630" ], [ "2842", "158377", "112295", "4857" ], [ "4222", "142841", "146695", "9736" ] ] ] }, { "name": "changes_in_node", "index": "12", "type": "nominal", "distinct": "4", "missing": "0", "distr": [ [ "no", "lacunar", "lac_margin", "lac_central" ], [ [ "3826", "124599", "53855", "4470" ], [ "3207", "152510", "106864", "12584" ], [ "6908", "156046", "114620", "8967" ], [ "2567", "110340", "134333", "4304" ] ] ] }, { "name": "changes_in_stru", "index": "13", "type": "nominal", "distinct": "8", "missing": "0", "distr": [ [ "no", "grainy", "drop_like", "coarse", "diluted", "reticular", "stripped", "faint" ], [ [ "2798", "42658", "35133", "3457" ], [ "2562", "63614", "42063", "3583" ], [ "1933", "80024", "54284", "3616" ], [ "1921", "80116", "55248", "3947" ], [ "1826", "78427", "57717", "4313" ], [ "1869", "42898", "35903", "3559" ], [ "1777", "45060", "49194", "3605" ], [ "1822", "110698", "80130", "4245" ] ] ] }, { "name": "special_forms", "index": "14", "type": "nominal", "distinct": "3", "missing": "0", "distr": [ [ "no", "chalices", "vesicles" ], [ [ "7730", "118843", "87016", "8499" ], [ "4112", "183124", "80477", "9006" ], [ "4666", "241528", "242179", "12820" ] ] ] }, { "name": "dislocation_of", "index": "15", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "no", "yes" ], [ [ "9547", "229251", "156796", "15309" ], [ "6961", "314244", "252876", "15016" ] ] ] }, { "name": "exclusion_of_no", "index": "16", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "no", "yes" ], [ [ "8308", "221570", "115642", "10859" ], [ "8200", "321925", "294030", "19466" ] ] ] }, { "name": "no_of_nodes_in", "index": "17", "type": "numeric", "distinct": "301533", "missing": "0", "min": "1", "max": "10", "mean": "3", "stdev": "2" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }