{ "data_id": "46336", "name": "hayes-roth_clean", "exact_name": "hayes-roth_clean", "version": 1, "version_label": null, "description": "**Author**: Barbara and Frederick Hayes-Roth \n \n**Source**: [original](https:\/\/archive.ics.uci.edu\/ml\/datasets\/Hayes-Roth) - \n**Please cite**: \n\nHayes-Roth Database\n\nThis is a merged version of the separate train and test set which are usually distributed. On OpenML this train-test split can be found as one of the possible tasks.\n\nSource Information: \n(a) Creators: Barbara and Frederick Hayes-Roth \n(b) Donor: David W. Aha (aha@ics.uci.edu) (714) 856-8779 \n(c) Date: March, 1989 \n\nAttribute Information: \n-- 1. name: distinct for each instance and represented numerically \n-- 2. hobby: nominal values ranging between 1 and 3 \n-- 3. age: nominal values ranging between 1 and 4 \n-- 4. educational level: nominal values ranging between 1 and 4 \n-- 5. marital status: nominal values ranging between 1 and 4 \n-- 6. class: nominal value between 1 and 3 \n\nDetailed description of the experiment: \n1. 3 categories (1, 2, and neither -- which I call 3) \n-- some of the instances could be classified in either class 1 or 2, and they have been evenly distributed between the two classes \n2. 5 Attributes \n-- A. name (a randomly-generated number between 1 and 132) \n-- B. hobby (a randomly-generated number between 1 and 3) \n-- C. age (a number between 1 and 4) \n-- D. education level (a number between 1 and 4) \n-- E. marital status (a number between 1 and 4) \n3. Classification: \n-- only attributes C-E are diagnostic; values for A and B are ignored \n-- Class Neither: if a 4 occurs for any attribute C-E \n-- Class 1: Otherwise, if (# of 1's)>(# of 2's) for attributes C-E \n-- Class 2: Otherwise, if (# of 2's)>(# of 1's) for attributes C-E \n-- Either 1 or 2: Otherwise, if (# of 2's)=(# of 1's) for attributes C-E \n4. Prototypes: \n-- Class 1: 111 \n-- Class 2: 222 \n-- Class Either: 333 \n-- Class Neither: 444\n-----\nWe have redefined the number of classes to account for the real number of observations.", "format": "arff", "uploader": "Bruno Belucci Teixeira", "uploader_id": 30703, "visibility": "public", "creator": "\"Barbara and Frederick Hayes-Roth\"", "contributor": "\"Bruno Belucci\"", "date": "2024-09-05 17:26:46", "update_comment": null, "last_update": "2024-09-05 17:26:46", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/api.openml.org\/data\/download\/22120905\/dataset", "default_target_attribute": "class", "row_id_attribute": null, "ignore_attribute": null, "runs": 0, "suggest": { "input": [ "hayes-roth_clean", "Hayes-Roth Database This is a merged version of the separate train and test set which are usually distributed. On OpenML this train-test split can be found as one of the possible tasks. Source Information: (a) Creators: Barbara and Frederick Hayes-Roth (b) Donor: David W. Aha (aha@ics.uci.edu) (714) 856-8779 (c) Date: March, 1989 Attribute Information: -- 1. name: distinct for each instance and represented numerically -- 2. hobby: nominal values ranging between 1 and 3 -- 3. age: nominal values " ], "weight": 5 }, "qualities": { "NumberOfInstances": 160, "NumberOfFeatures": 5, "NumberOfClasses": 3, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 4, "NumberOfSymbolicFeatures": 1, "AutoCorrelation": 0.4088050314465409, "PercentageOfMissingValues": 0, "Dimensionality": 0.03125, "PercentageOfNumericFeatures": 80, "MajorityClassPercentage": 40.625, "PercentageOfSymbolicFeatures": 20, "MajorityClassSize": 65, "MinorityClassPercentage": 19.375, "MinorityClassSize": 31, "NumberOfBinaryFeatures": 0, "PercentageOfBinaryFeatures": 0, "PercentageOfInstancesWithMissingValues": 0 }, "tags": [], "features": [ { "name": "class", "index": "4", "type": "nominal", "distinct": "3", "missing": "0", "target": "1", "distr": [ [ "1", "2", "3" ], [ [ "65", "0", "0" ], [ "0", "64", "0" ], [ "0", "0", "31" ] ] ] }, { "name": "hobby", "index": "0", "type": "numeric", "distinct": "3", "missing": "0", "min": "1", "max": "3", "mean": "2", "stdev": "1" }, { "name": "age", "index": "1", "type": "numeric", "distinct": "4", "missing": "0", "min": "1", "max": "4", "mean": "2", "stdev": "1" }, { "name": "educational_level", "index": "2", "type": "numeric", "distinct": "4", "missing": "0", "min": "1", "max": "4", "mean": "2", "stdev": "1" }, { "name": "marital_status", "index": "3", "type": "numeric", "distinct": "4", "missing": "0", "min": "1", "max": "4", "mean": "2", "stdev": "1" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }