{ "data_id": "467", "name": "analcatdata_japansolvent", "exact_name": "analcatdata_japansolvent", "version": 1, "version_label": null, "description": "**Author**: \n**Source**: Unknown - Date unknown \n**Please cite**: \n\nanalcatdata A collection of data sets used in the book \"Analyzing Categorical Data,\"\nby Jeffrey S. Simonoff, Springer-Verlag, New York, 2003. The submission\nconsists of a zip file containing two versions of each of 84 data sets,\nplus this README file. Each data set is given in comma-delimited ASCII\n(.csv) form, and Microsoft Excel (.xls) form.\n\nNOTICE: These data sets may be used freely for scientific, educational and\/or\nnoncommercial purposes, provided suitable acknowledgment is given (by citing\nthe above-named reference).\n\nFurther details concerning the book, including information on statistical software\n(including sample S-PLUS\/R and SAS code), are available at the web site\n\nhttp:\/\/www.stern.nyu.edu\/~jsimonof\/AnalCatData\n\n\nInformation about the dataset\nCLASSTYPE: nominal\nCLASSINDEX: 2\n\n\nNote: Quotes, Single-Quotes and Backslashes were removed, Blanks replaced\nwith Underscores", "format": "ARFF", "uploader": "Joaquin Vanschoren", "uploader_id": 2, "visibility": "public", "creator": "Jeffrey S. Simonoff", "contributor": null, "date": "2014-09-28 23:51:21", "update_comment": "ignore feature", "last_update": "2014-09-29 02:06:24", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/52579\/analcatdata_japansolvent.arff", "default_target_attribute": "Solvent", "row_id_attribute": null, "ignore_attribute": "\"Firm\"", "runs": 103, "suggest": { "input": [ "analcatdata_japansolvent", "analcatdata A collection of data sets used in the book \"Analyzing Categorical Data,\" by Jeffrey S. Simonoff, Springer-Verlag, New York, 2003. The submission consists of a zip file containing two versions of each of 84 data sets, plus this README file. Each data set is given in comma-delimited ASCII (.csv) form, and Microsoft Excel (.xls) form. NOTICE: These data sets may be used freely for scientific, educational and\/or noncommercial purposes, provided suitable acknowledgment is given (by citing " ], "weight": 5 }, "qualities": { "NumberOfInstances": 52, "NumberOfFeatures": 9, "NumberOfClasses": 2, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 8, "NumberOfSymbolicFeatures": 1, "MeanSkewnessOfNumericAtts": -1.8963170948661292, "Quartile1StdDevOfNumericAtts": 0.1648560503784528, "REPTreeDepth2AUC": 0.8081481481481482, "CfsSubsetEval_kNN1NErrRate": 0.23076923076923078, "kNN1NAUC": 0.7044444444444444, "J48.001.Kappa": 0.6182085168869311, "MeanStdDevOfNumericAtts": 0.4923599948139881, "Quartile2AttributeEntropy": null, "REPTreeDepth2ErrRate": 0.21153846153846154, "CfsSubsetEval_kNN1NKappa": 0.536404160475483, "kNN1NErrRate": 0.28846153846153844, "MajorityClassPercentage": 51.92307692307693, "MinAttributeEntropy": null, "Quartile2KurtosisOfNumericAtts": 9.105779075481093, "REPTreeDepth2Kappa": 0.5794117647058823, "ClassEntropy": 0.9989326546260581, "kNN1NKappa": 0.4144144144144145, "MajorityClassSize": 27, "MinKurtosisOfNumericAtts": 2.4819953768125926, "Quartile2MeansOfNumericAtts": -0.041398076923076926, "REPTreeDepth3AUC": 0.8081481481481482, "DecisionStumpAUC": 0.8088888888888888, "MaxAttributeEntropy": null, "MinMeansOfNumericAtts": -0.15745, "Quartile2MutualInformation": null, "REPTreeDepth3ErrRate": 0.21153846153846154, "DecisionStumpErrRate": 0.19230769230769232, "MaxKurtosisOfNumericAtts": 16.59695191408378, "MinMutualInformation": null, "Quartile2SkewnessOfNumericAtts": -2.595332419270574, "REPTreeDepth3Kappa": 0.5794117647058823, "DecisionStumpKappa": 0.6182085168869311, "MaxMeansOfNumericAtts": 1.4091384615384615, "MinNominalAttDistinctValues": 2, "PercentageOfBinaryFeatures": 11.11111111111111, "Quartile2StdDevOfNumericAtts": 0.4720719874306799, "RandomTreeDepth1AUC": 0.7651851851851852, "Dimensionality": 0.17307692307692307, "MaxMutualInformation": null, "MinSkewnessOfNumericAtts": -3.5820091265162195, "PercentageOfInstancesWithMissingValues": 0, "Quartile3AttributeEntropy": null, "RandomTreeDepth1ErrRate": 0.25, "EquivalentNumberOfAtts": null, "MaxNominalAttDistinctValues": 2, "MinStdDevOfNumericAtts": 0.13893984678860496, "PercentageOfMissingValues": 0, "Quartile3KurtosisOfNumericAtts": 14.17031485609937, "AutoCorrelation": 0.9803921568627451, "RandomTreeDepth1Kappa": 0.5029411764705882, "J48.00001.AUC": 0.8088888888888888, "MaxSkewnessOfNumericAtts": 1.5153236456169954, "MinorityClassPercentage": 48.07692307692308, "PercentageOfNumericFeatures": 88.88888888888889, "Quartile3MeansOfNumericAtts": 0.11927932692307695, "CfsSubsetEval_DecisionStumpAUC": 0.8088888888888888, "RandomTreeDepth2AUC": 0.7703703703703705, "J48.00001.ErrRate": 0.19230769230769232, "MaxStdDevOfNumericAtts": 0.877689796948885, "MinorityClassSize": 25, "PercentageOfSymbolicFeatures": 11.11111111111111, "Quartile3MutualInformation": null, "CfsSubsetEval_DecisionStumpErrRate": 0.19230769230769232, "RandomTreeDepth2ErrRate": 0.21153846153846154, "J48.00001.Kappa": 0.6182085168869311, "MeanAttributeEntropy": null, "NaiveBayesAUC": 0.930014245014245, "Quartile1AttributeEntropy": null, "Quartile3SkewnessOfNumericAtts": 0.15744581378762534, "CfsSubsetEval_DecisionStumpKappa": 0.6182085168869311, "RandomTreeDepth2Kappa": 0.5781710914454277, "J48.0001.AUC": 0.8088888888888888, "MeanKurtosisOfNumericAtts": 8.966130687202481, "NaiveBayesErrRate": 0.23076923076923078, "Quartile1KurtosisOfNumericAtts": 3.1509616246860106, "Quartile3StdDevOfNumericAtts": 0.8410933772633731, "CfsSubsetEval_NaiveBayesAUC": 0.8066951566951567, "RandomTreeDepth3AUC": 0.8007407407407409, "J48.0001.ErrRate": 0.19230769230769232, "MeanMeansOfNumericAtts": 0.14231802884615383, "MeanMutualInformation": null, "NaiveBayesKappa": 0.5322338830584709, "Quartile1MeansOfNumericAtts": -0.1072826923076923, "REPTreeDepth1AUC": 0.8081481481481482, "CfsSubsetEval_NaiveBayesErrRate": 0.23076923076923078, "RandomTreeDepth3ErrRate": 0.19230769230769232, "J48.0001.Kappa": 0.6182085168869311, "MeanNoiseToSignalRatio": null, "NumberOfBinaryFeatures": 1, "Quartile1MutualInformation": null, "REPTreeDepth1ErrRate": 0.21153846153846154, "CfsSubsetEval_NaiveBayesKappa": 0.5377777777777778, "RandomTreeDepth3Kappa": 0.6170839469808542, "J48.001.AUC": 0.8088888888888888, "MeanNominalAttDistinctValues": 2, "Quartile1SkewnessOfNumericAtts": -3.409692191247869, "REPTreeDepth1Kappa": 0.5794117647058823, "CfsSubsetEval_kNN1NAUC": 0.7674074074074075, "StdvNominalAttDistinctValues": 0, "J48.001.ErrRate": 0.19230769230769232 }, "tags": [ { "tag": "mythbusting_1", "uploader": "1" }, { "tag": "study_1", "uploader": "2" }, { "tag": "study_15", "uploader": "939" }, { "tag": "study_20", "uploader": "939" } ], "topics": [ { "topic": "Book-based", "uploader": "8111" } ], "features": [ { "name": "Solvent", "index": "1", "type": "nominal", "distinct": "2", "missing": "0", "target": "1", "distr": [ [ "0", "1" ], [ [ "25", "0" ], [ "0", "27" ] ] ] }, { "name": "Firm", "index": "0", "type": "nominal", "distinct": "52", "missing": "0", "ignore": "1", "distr": [ [ "Aiden", "Ando_Iron_Works", "Asahi_Seiko", "Chuo_Seikakusho", "Chuyu", "Dai-Nippon_Sugar_Mfg", "Doko_Spinning", "Fuji_Seito", "Fujiya_Electric", "Gisen", "Hamaguchi_Senco", "Hikari_Bussiness_For", "Hitachi_Ferrite", "Ishii_Precision_Tool", "Japan_Drop_Forge", "Kohjin", "Kojima_Iron_Works", "Maeda_Metal_Ind.", "Mamiya_Camera", "Marine_Techno", "Meiji_Sugar_Mfg.", "Metalart", "Mie_Horo", "Mino_Ceramic", "Miroku_Firearms_Mfg.", "Monde_Distilleries", "Morio_Denki", "Nagahama_Gohan", "Nagoya_Lumber", "Nagoya_Seito", "Nankai_Worsted_Spin", "Nihon_Aeroplane_Mfg.", "Nihon_Sugar_Refining", "Nippon_Orimono_Kato", "Nippon_Tile_Industri", "Osaka_Meter", "Osaka_Yogyo", "SR_Suntour", "Saga_Paper_Board", "Sakonic", "Sakurai_Iron_Works", "Sankyo_Special_Steel", "Sansei_Mfg.", "Shoun_Machine_Tool", "Takeni_Senka", "Toa_Electronics", "Tokuyama", "Toyo_Sugar", "Tsunoda", "Uemori_Agricultural", "Yamato_Woolen_Textil", "Yoshida_Machine_Tool" ], [ [ "1", "0" ], [ "1", "0" ], [ "1", "0" ], [ "0", "1" ], [ "0", "1" ], [ "1", "0" ], [ "0", "1" ], [ "0", "1" ], [ "1", "0" ], [ "0", "1" ], [ "1", "0" ], [ "0", "1" ], [ "1", "0" ], [ "0", "1" ], [ "0", "1" ], [ "1", "0" ], [ "0", "1" ], [ "0", "1" ], [ "1", "0" ], [ "0", "1" ], [ "1", "0" ], [ "0", "1" ], [ "0", "1" ], [ "0", "1" ], [ "0", "1" ], [ "1", "0" ], [ "0", "1" ], [ "1", "0" ], [ "0", "1" ], [ "1", "0" ], [ "0", "1" ], [ "1", "0" ], [ "0", "1" ], [ "0", "1" ], [ "1", "0" ], [ "1", "0" ], [ "1", "0" ], [ "0", "1" ], [ "1", "0" ], [ "0", "1" ], [ "1", "0" ], [ "1", "0" ], [ "1", "0" ], [ "0", "1" ], [ "1", "0" ], [ "0", "1" ], [ "0", "1" ], [ "0", "1" ], [ "0", "1" ], [ "1", "0" ], [ "1", "0" ], [ "1", "0" ] ] ] }, { "name": "EBIT\/TA", "index": "2", "type": "numeric", "distinct": "49", "missing": "0", "min": "-1", "max": "0", "mean": "0", "stdev": "0" }, { "name": "NI\/TC", "index": "3", "type": "numeric", "distinct": "52", "missing": "0", "min": "-4", "max": "1", "mean": "0", "stdev": "1" }, { "name": "Sales\/TA", "index": "4", "type": "numeric", "distinct": "52", "missing": "0", "min": "0", "max": "4", "mean": "1", "stdev": "1" }, { "name": "EBIT\/Sales", "index": "5", "type": "numeric", "distinct": "47", "missing": "0", "min": "-1", "max": "0", "mean": "0", "stdev": "0" }, { "name": "NI\/Sales", "index": "6", "type": "numeric", "distinct": "45", "missing": "0", "min": "-1", "max": "0", "mean": "0", "stdev": "0" }, { "name": "WC\/TA", "index": "7", "type": "numeric", "distinct": "49", "missing": "0", "min": "-2", "max": "0", "mean": "0", "stdev": "0" }, { "name": "Equity\/TL", "index": "8", "type": "numeric", "distinct": "51", "missing": "0", "min": "-1", "max": "2", "mean": "0", "stdev": "0" }, { "name": "Equity\/TA", "index": "9", "type": "numeric", "distinct": "49", "missing": "0", "min": "-4", "max": "1", "mean": "0", "stdev": "1" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }