{ "data_id": "18", "name": "mfeat-morphological", "exact_name": "mfeat-morphological", "version": 1, "version_label": "1", "description": "**Author**: Robert P.W. Duin, Department of Applied Physics, Delft University of Technology \r\n**Source**: [UCI](https:\/\/archive.ics.uci.edu\/ml\/datasets\/Multiple+Features) - 1998 \r\n**Please cite**: [UCI](https:\/\/archive.ics.uci.edu\/ml\/citation_policy.html) \r\n\r\n**Multiple Features Dataset: Morphological** \r\nOne of a set of 6 datasets describing features of handwritten numerals (0 - 9) extracted from a collection of Dutch utility maps. Corresponding patterns in different datasets correspond to the same original character. 200 instances per class (for a total of 2,000 instances) have been digitized in binary images. \r\n\r\nIn this dataset, these digits are represented in terms of 6 morphological features. \r\n\r\n### Attribute Information \r\nThe meaning of the features is mostly unknown. They are never named in the original files, and the paper only talks about 'morphological features, such as the number of endpoints'.\r\n\r\n### Relevant Papers \r\nA slightly different version of the database is used in \r\nM. van Breukelen, R.P.W. Duin, D.M.J. Tax, and J.E. den Hartog, Handwritten digit recognition by combined classifiers, Kybernetika, vol. 34, no. 4, 1998, 381-386.\r\n \r\nThe database as is is used in: \r\nA.K. Jain, R.P.W. Duin, J. Mao, Statistical Pattern Recognition: A Review, IEEE Transactions on Pattern Analysis and Machine Intelligence archive, Volume 22 Issue 1, January 2000 \r\n \r\n ", "format": "ARFF", "uploader": "Jan van Rijn", "uploader_id": 1, "visibility": "public", "creator": "Robert P.W. Duin", "contributor": null, "date": "2014-04-06 23:20:37", "update_comment": null, "last_update": "2014-04-06 23:20:37", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/18\/dataset_18_mfeat-morphological.arff", "default_target_attribute": "class", "row_id_attribute": null, "ignore_attribute": null, "runs": 36330, "suggest": { "input": [ "mfeat-morphological", "One of a set of 6 datasets describing features of handwritten numerals (0 - 9) extracted from a collection of Dutch utility maps. Corresponding patterns in different datasets correspond to the same original character. 200 instances per class (for a total of 2,000 instances) have been digitized in binary images. In this dataset, these digits are represented in terms of 6 morphological features. ### Attribute Information The meaning of the features is mostly unknown. They are never named in the or " ], "weight": 5 }, "qualities": { "NumberOfInstances": 2000, "NumberOfFeatures": 7, "NumberOfClasses": 10, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 6, "NumberOfSymbolicFeatures": 1, "Quartile2AttributeEntropy": null, "REPTreeDepth2ErrRate": 0.2935, "CfsSubsetEval_kNN1NKappa": 0.6722222222222222, "kNN1NErrRate": 0.3295, "MajorityClassPercentage": 10, "MeanStdDevOfNumericAtts": 630.90708251402, "Quartile2KurtosisOfNumericAtts": -0.6352635311790746, "REPTreeDepth2Kappa": 0.6738888888888889, "ClassEntropy": 3.321928094887362, "kNN1NKappa": 0.6338888888888888, "MajorityClassSize": 200, "MinAttributeEntropy": null, "Quartile2MeansOfNumericAtts": 1.686534392555002, "REPTreeDepth3AUC": 0.9442476388888889, "DecisionStumpAUC": 0.7612499999999999, "MaxAttributeEntropy": null, "MinKurtosisOfNumericAtts": -1.0383559313284294, "Quartile2MutualInformation": null, "REPTreeDepth3ErrRate": 0.2935, "DecisionStumpErrRate": 0.8015, "MaxKurtosisOfNumericAtts": 0.0794938700561878, "MinMeansOfNumericAtts": 0.49249999999999505, "Quartile2SkewnessOfNumericAtts": 0.6245331546193721, "REPTreeDepth3Kappa": 0.6738888888888889, "DecisionStumpKappa": 0.10944444444444444, "MaxMeansOfNumericAtts": 6155.200435156556, "MinMutualInformation": null, "PercentageOfBinaryFeatures": 0, "Quartile2StdDevOfNumericAtts": 0.9208719889146832, "RandomTreeDepth1AUC": 0.8167275, "Dimensionality": 0.0035, "MaxMutualInformation": null, "MinNominalAttDistinctValues": 10, "PercentageOfInstancesWithMissingValues": 0, "Quartile3AttributeEntropy": null, "RandomTreeDepth1ErrRate": 0.3345, "EquivalentNumberOfAtts": null, "MaxNominalAttDistinctValues": 10, "MinSkewnessOfNumericAtts": -0.06283666261436584, "PercentageOfMissingValues": 0, "Quartile3KurtosisOfNumericAtts": -0.11149071301766611, "AutoCorrelation": 0.9954977488744372, "RandomTreeDepth1Kappa": 0.6283333333333333, "J48.00001.AUC": 0.9114204166666667, "MaxSkewnessOfNumericAtts": 1.0084830014756712, "MinStdDevOfNumericAtts": 0.2913157171953473, "PercentageOfNumericFeatures": 85.71428571428571, "Quartile3MeansOfNumericAtts": 1656.114273214139, "CfsSubsetEval_DecisionStumpAUC": 0.9114204166666667, "RandomTreeDepth2AUC": 0.8167275, "J48.00001.ErrRate": 0.295, "MaxStdDevOfNumericAtts": 3757.634467006599, "MinorityClassPercentage": 10, "PercentageOfSymbolicFeatures": 14.285714285714285, "Quartile3MutualInformation": null, "CfsSubsetEval_DecisionStumpErrRate": 0.295, "RandomTreeDepth2ErrRate": 0.3345, "J48.00001.Kappa": 0.6722222222222222, "MeanAttributeEntropy": null, "MinorityClassSize": 200, "Quartile1AttributeEntropy": null, "Quartile3SkewnessOfNumericAtts": 0.7676581134191288, "CfsSubsetEval_DecisionStumpKappa": 0.6722222222222222, "RandomTreeDepth2Kappa": 0.6283333333333333, "J48.0001.AUC": 0.9114204166666667, "MeanKurtosisOfNumericAtts": -0.536236922624337, "NaiveBayesAUC": 0.9512127777777779, "Quartile1KurtosisOfNumericAtts": -0.8692491113871175, "Quartile3StdDevOfNumericAtts": 958.1661269687643, "CfsSubsetEval_NaiveBayesAUC": 0.9114204166666667, "RandomTreeDepth3AUC": 0.8167275, "J48.0001.ErrRate": 0.295, "MeanMeansOfNumericAtts": 1052.6997316402776, "NaiveBayesErrRate": 0.2995, "Quartile1MeansOfNumericAtts": 0.6582499999999927, "REPTreeDepth1AUC": 0.9442476388888889, "CfsSubsetEval_NaiveBayesErrRate": 0.295, "RandomTreeDepth3ErrRate": 0.3345, "J48.0001.Kappa": 0.6722222222222222, "MeanMutualInformation": null, "NaiveBayesKappa": 0.6672222222222223, "Quartile1MutualInformation": null, "REPTreeDepth1ErrRate": 0.2935, "CfsSubsetEval_NaiveBayesKappa": 0.6722222222222222, "RandomTreeDepth3Kappa": 0.6283333333333333, "J48.001.AUC": 0.9114204166666667, "MeanNoiseToSignalRatio": null, "NumberOfBinaryFeatures": 0, "Quartile1SkewnessOfNumericAtts": 0.21477131477248879, "REPTreeDepth1Kappa": 0.6738888888888889, "CfsSubsetEval_kNN1NAUC": 0.9114204166666667, "StdvNominalAttDistinctValues": 0, "J48.001.ErrRate": 0.295, "MeanNominalAttDistinctValues": 10, "Quartile1StdDevOfNumericAtts": 0.571544999056086, "REPTreeDepth2AUC": 0.9442476388888889, "CfsSubsetEval_kNN1NErrRate": 0.295, "kNN1NAUC": 0.8227808333333333, "J48.001.Kappa": 0.6722222222222222, "MeanSkewnessOfNumericAtts": 0.5315671843447396 }, "tags": [ { "uploader": "38960", "tag": "Machine Learning" }, { "uploader": "1", "tag": "OpenML-CC18" }, { "uploader": "348", "tag": "OpenML100" }, { "uploader": "2", "tag": "study_1" }, { "uploader": "3886", "tag": "study_123" }, { "uploader": "64", "tag": "study_14" }, { "uploader": "1", "tag": "study_34" }, { "uploader": "1", "tag": "study_37" }, { "uploader": "1", "tag": "study_41" }, { "uploader": "64", "tag": "study_52" }, { "uploader": "64", "tag": "study_7" }, { "uploader": "1856", "tag": "study_70" }, { "uploader": "3198", "tag": "study_76" }, { "uploader": "1935", "tag": "study_98" }, { "uploader": "1", "tag": "study_99" } ], "features": [ { "name": "class", "index": "6", "type": "nominal", "distinct": "10", "missing": "0", "target": "1", "distr": [ [ "1", "2", "3", "4", "5", "6", "7", "8", "9", "10" ], [ [ "200", "0", "0", "0", "0", "0", "0", "0", "0", "0" ], [ "0", "200", "0", "0", "0", "0", "0", "0", "0", "0" ], [ "0", "0", "200", "0", "0", "0", "0", "0", "0", "0" ], [ "0", "0", "0", "200", "0", "0", "0", "0", "0", "0" ], [ "0", "0", "0", "0", "200", "0", "0", "0", "0", "0" ], [ "0", "0", "0", "0", "0", "200", "0", "0", "0", "0" ], [ "0", "0", "0", "0", "0", "0", "200", "0", "0", "0" ], [ "0", "0", "0", "0", "0", "0", "0", "200", "0", "0" ], [ "0", "0", "0", "0", "0", "0", "0", "0", "200", "0" ], [ "0", "0", "0", "0", "0", "0", "0", "0", "0", "200" ] ] ] }, { "name": "att1", "index": "0", "type": "numeric", "distinct": "3", "missing": "0", "min": "0", "max": "2", "mean": "0", "stdev": "1" }, { "name": "att2", "index": "1", "type": "numeric", "distinct": "7", "missing": "0", "min": "0", "max": "6", "mean": "2", "stdev": "1" }, { "name": "att3", "index": "2", "type": "numeric", "distinct": "6", "missing": "0", "min": "0", "max": "5", "mean": "1", "stdev": "1" }, { "name": "att4", "index": "3", "type": "numeric", "distinct": "1717", "missing": "0", "min": "100", "max": "231", "mean": "156", "stdev": "25" }, { "name": "att5", "index": "4", "type": "numeric", "distinct": "1886", "missing": "0", "min": "1", "max": "3", "mean": "2", "stdev": "0" }, { "name": "att6", "index": "5", "type": "numeric", "distinct": "1888", "missing": "0", "min": "1440", "max": "17572", "mean": "6155", "stdev": "3758" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }