{ "data_id": "453", "name": "analcatdata_bondrate", "exact_name": "analcatdata_bondrate", "version": 1, "version_label": null, "description": "**Author**: \n**Source**: Unknown - Date unknown \n**Please cite**: \n\nanalcatdata A collection of data sets used in the book \"Analyzing Categorical Data,\"\nby Jeffrey S. Simonoff, Springer-Verlag, New York, 2003. The submission\nconsists of a zip file containing two versions of each of 84 data sets,\nplus this README file. Each data set is given in comma-delimited ASCII\n(.csv) form, and Microsoft Excel (.xls) form.\n\nNOTICE: These data sets may be used freely for scientific, educational and\/or\nnoncommercial purposes, provided suitable acknowledgment is given (by citing\nthe above-named reference).\n\nFurther details concerning the book, including information on statistical software\n(including sample S-PLUS\/R and SAS code), are available at the web site\n\nhttp:\/\/www.stern.nyu.edu\/~jsimonof\/AnalCatData\n\n\nInformation about the dataset\nCLASSTYPE: nominal\nCLASSINDEX: last\n\n\nNote: Quotes, Single-Quotes and Backslashes were removed, Blanks replaced\nwith Underscores", "format": "ARFF", "uploader": "Joaquin Vanschoren", "uploader_id": 2, "visibility": "public", "creator": "Jeffrey S. Simonoff", "contributor": null, "date": "2014-09-28 23:50:54", "update_comment": "ignore feature", "last_update": "2014-09-29 02:16:37", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/52565\/analcatdata_bondrate.arff", "kaggle_url": null, "default_target_attribute": "Rating", "row_id_attribute": null, "ignore_attribute": "\"City\"", "runs": 32, "suggest": { "input": [ "analcatdata_bondrate", "analcatdata A collection of data sets used in the book \"Analyzing Categorical Data,\" by Jeffrey S. Simonoff, Springer-Verlag, New York, 2003. The submission consists of a zip file containing two versions of each of 84 data sets, plus this README file. Each data set is given in comma-delimited ASCII (.csv) form, and Microsoft Excel (.xls) form. NOTICE: These data sets may be used freely for scientific, educational and\/or noncommercial purposes, provided suitable acknowledgment is given (by citing " ], "weight": 5 }, "qualities": { "NumberOfInstances": 57, "NumberOfFeatures": 11, "NumberOfClasses": 5, "NumberOfMissingValues": 1, "NumberOfInstancesWithMissingValues": 1, "NumberOfNumericFeatures": 4, "NumberOfSymbolicFeatures": 7, "J48.001.ErrRate": 0.42105263157894735, "MeanNominalAttDistinctValues": 5.571428571428571, "Quartile1SkewnessOfNumericAtts": 0.20141980926945627, "REPTreeDepth1Kappa": -0.020370370370370396, "CfsSubsetEval_kNN1NAUC": 0.4843130639570268, "StdvNominalAttDistinctValues": 2.9920529661723827, "J48.001.Kappa": 0, "MeanSkewnessOfNumericAtts": 1.2828319970010231, "Quartile1StdDevOfNumericAtts": 2920.3917720262843, "REPTreeDepth2AUC": 0.540354846391998, "CfsSubsetEval_kNN1NErrRate": 0.42105263157894735, "kNN1NAUC": 0.5181342307503298, "MajorityClassPercentage": 57.89473684210527, "MeanStdDevOfNumericAtts": 788385.2172720972, "Quartile2AttributeEntropy": 2.0992566826171357, "REPTreeDepth2ErrRate": 0.5087719298245614, "CfsSubsetEval_kNN1NKappa": 0, "kNN1NErrRate": 0.543859649122807, "kNN1NKappa": 0.0586041555673947, "MajorityClassSize": 33, "MinAttributeEntropy": 0.8314743880097293, "Quartile2KurtosisOfNumericAtts": 0.7081811289032955, "REPTreeDepth2Kappa": -0.020370370370370396, "ClassEntropy": 1.6819431470376087, "MaxAttributeEntropy": 2.9935181238694586, "MinKurtosisOfNumericAtts": -0.16259574493510742, "Quartile2MeansOfNumericAtts": 49782.254385964916, "REPTreeDepth3AUC": 0.540354846391998, "DecisionStumpAUC": 0.5074428151827532, "MaxKurtosisOfNumericAtts": 14.352345493263488, "MinMeansOfNumericAtts": 16569.947368421053, "Quartile2MutualInformation": 0.32629818140253, "REPTreeDepth3ErrRate": 0.5087719298245614, "DecisionStumpErrRate": 0.45614035087719296, "MaxMeansOfNumericAtts": 2315386.25, "MinMutualInformation": 0.0634174989093, "Quartile2SkewnessOfNumericAtts": 0.7397070784216985, "REPTreeDepth3Kappa": -0.020370370370370396, "DecisionStumpKappa": -0.0013513513513513384, "MaxMutualInformation": 0.41495113227637, "MinNominalAttDistinctValues": 2, "PercentageOfBinaryFeatures": 9.090909090909092, "Quartile2StdDevOfNumericAtts": 6730.822510775339, "RandomTreeDepth1AUC": 0.503664216473814, "Dimensionality": 0.19298245614035087, "MaxNominalAttDistinctValues": 10, "MinSkewnessOfNumericAtts": 0.07721512007614457, "PercentageOfInstancesWithMissingValues": 1.7543859649122806, "Quartile3AttributeEntropy": 2.7709046327097067, "RandomTreeDepth1ErrRate": 0.5614035087719298, "EquivalentNumberOfAtts": 6.221690518952286, "MaxSkewnessOfNumericAtts": 3.5746987110845514, "MinStdDevOfNumericAtts": 2094.4321973564356, "PercentageOfMissingValues": 0.1594896331738437, "Quartile3KurtosisOfNumericAtts": 10.966732706188619, "AutoCorrelation": 0.375, "RandomTreeDepth1Kappa": 0.002188183807439804, "J48.00001.AUC": 0.4843130639570268, "MaxStdDevOfNumericAtts": 3137984.7918694816, "MinorityClassPercentage": 1.7543859649122806, "PercentageOfNumericFeatures": 36.36363636363637, "Quartile3MeansOfNumericAtts": 1750349.9111842103, "CfsSubsetEval_DecisionStumpAUC": 0.4843130639570268, "RandomTreeDepth2AUC": 0.503664216473814, "J48.00001.ErrRate": 0.42105263157894735, "MeanAttributeEntropy": 1.9492671045022836, "MinorityClassSize": 1, "PercentageOfSymbolicFeatures": 63.63636363636363, "Quartile3MutualInformation": 0.412742642039575, "CfsSubsetEval_DecisionStumpErrRate": 0.42105263157894735, "RandomTreeDepth2ErrRate": 0.5614035087719298, "J48.00001.Kappa": 0, "MeanKurtosisOfNumericAtts": 3.901528001533743, "NaiveBayesAUC": 0.49143377548950307, "Quartile1AttributeEntropy": 0.9394160576852717, "Quartile3SkewnessOfNumericAtts": 2.9073691033119156, "CfsSubsetEval_DecisionStumpKappa": 0, "RandomTreeDepth2Kappa": 0.002188183807439804, "J48.0001.AUC": 0.4843130639570268, "MeanMeansOfNumericAtts": 607880.1765350878, "NaiveBayesErrRate": 0.631578947368421, "Quartile1KurtosisOfNumericAtts": 0.029670169509314448, "Quartile3StdDevOfNumericAtts": 2355504.43753349, "CfsSubsetEval_NaiveBayesAUC": 0.4843130639570268, "RandomTreeDepth3AUC": 0.503664216473814, "J48.0001.ErrRate": 0.42105263157894735, "MeanMutualInformation": 0.27033539227226666, "NaiveBayesKappa": -0.021403683424589412, "Quartile1MeansOfNumericAtts": 23508.364035087718, "REPTreeDepth1AUC": 0.540354846391998, "CfsSubsetEval_NaiveBayesErrRate": 0.42105263157894735, "RandomTreeDepth3ErrRate": 0.5614035087719298, "J48.0001.Kappa": 0, "J48.001.AUC": 0.4843130639570268, "MeanNoiseToSignalRatio": 6.2105508942724414, "NumberOfBinaryFeatures": 1, "Quartile1MutualInformation": 0.075135035488995, "REPTreeDepth1ErrRate": 0.5087719298245614, "CfsSubsetEval_NaiveBayesKappa": 0, "RandomTreeDepth3Kappa": 0.002188183807439804 }, "tags": [ { "uploader": "38960", "tag": "Data Science" }, { "uploader": "2", "tag": "study_1" } ], "topics": [ { "topic": "Book-based", "uploader": "8111" } ], "features": [ { "name": "Rating", "index": "11", "type": "nominal", "distinct": "5", "missing": "0", "target": "1", "distr": [ [ "(1)_AAA", "(2)_AA", "(3)_A", "(4)_BBB", "(5)_BB" ], [ [ "6", "0", "0", "0", "0" ], [ "0", "33", "0", "0", "0" ], [ "0", "0", "12", "0", "0" ], [ "0", "0", "0", "5", "0" ], [ "0", "0", "0", "0", "1" ] ] ] }, { "name": "City", "index": "0", "type": "nominal", "distinct": "57", "missing": "0", "ignore": "1", "distr": [ [ "Allentown", "Atlanta", "Austin", "Bakersfield", "Baltimore", "Birmingham", "Boston", "Buffalo", "Charleston", "Chicago", "Cincinatti", "Cleveland", "Columbus", "Dallas", "Dayton", "Denver", "Detroit", "Durham", "El_Paso", "Grand_Rapids", "Greensboro", "Hartford", "Honolulu", "Houston", "Jacksonville", "Kansas_City", "Knoxville", "Las_Vegas", "Little_Rock", "Los_Angeles", "Louisville", "Memphis", "Miami", "Milwaukee", "New_Haven", "New_York_City", "Norfolk", "Oklahoma_City", "Philadelphia", "Phoenix", "Pittsburgh", "Providence", "Raleigh", "Richmond", "Rochester", "Sacramento", "San_Antonio", "San_Diego", "San_Francisco", "Seattle", "St_Louis", "Syracuse", "Toledo", "Tucson", "Tulsa", "Twin_Cities", "Worcester" ], [ [ "0", "1", "0", "0", "0" ], [ "0", "1", "0", "0", "0" ], [ "0", "1", "0", "0", "0" ], [ "0", "0", "1", "0", "0" ], [ "0", "0", "1", "0", "0" ], [ "0", "1", "0", "0", "0" ], [ "0", "0", "1", "0", "0" ], [ "0", "0", "0", "1", "0" ], [ "0", "1", "0", "0", "0" ], [ "0", "0", "1", "0", "0" ], [ "0", "1", "0", "0", "0" ], [ "0", "0", "1", "0", "0" ], [ "1", "0", "0", "0", "0" ], [ "1", "0", "0", "0", "0" ], [ "0", "1", "0", "0", "0" ], [ "0", "1", "0", "0", "0" ], [ "0", "0", "0", "1", "0" ], [ "1", "0", "0", "0", "0" ], [ "0", "1", "0", "0", "0" ], [ "0", "0", "1", "0", "0" ], [ "1", "0", "0", "0", "0" ], [ "0", "1", "0", "0", "0" ], [ "0", "1", "0", "0", "0" ], [ "0", "1", "0", "0", "0" ], [ "0", "1", "0", "0", "0" ], [ "0", "1", "0", "0", "0" ], [ "0", "1", "0", "0", "0" ], [ "0", "0", "1", "0", "0" ], [ "0", "1", "0", "0", "0" ], [ "0", "1", "0", "0", "0" ], [ "0", "1", "0", "0", "0" ], [ "0", "1", "0", "0", "0" ], [ "0", "0", "1", "0", "0" ], [ "0", "1", "0", "0", "0" ], [ "0", "0", "0", "1", "0" ], [ "0", "0", "1", "0", "0" ], [ "0", "1", "0", "0", "0" ], [ "0", "1", "0", "0", "0" ], [ "0", "0", "0", "0", "1" ], [ "0", "1", "0", "0", "0" ], [ "0", "0", "1", "0", "0" ], [ "0", "0", "0", "1", "0" ], [ "1", "0", "0", "0", "0" ], [ "0", "1", "0", "0", "0" ], [ "0", "1", "0", "0", "0" ], [ "0", "1", "0", "0", "0" ], [ "0", "1", "0", "0", "0" ], [ "0", "1", "0", "0", "0" ], [ "0", "1", "0", "0", "0" ], [ "0", "1", "0", "0", "0" ], [ "0", "0", "0", "1", "0" ], [ "0", "1", "0", "0", "0" ], [ "0", "0", "1", "0", "0" ], [ "0", "1", "0", "0", "0" ], [ "0", "1", "0", "0", "0" ], [ "1", "0", "0", "0", "0" ], [ "0", "0", "1", "0", "0" ] ] ] }, { "name": "Population", "index": "1", "type": "numeric", "distinct": "56", "missing": "1", "min": "506875", "max": "17953372", "mean": "2315386", "stdev": "3137985" }, { "name": "Per_capita_income", "index": "2", "type": "numeric", "distinct": "56", "missing": "0", "min": "10697", "max": "22003", "mean": "16570", "stdev": "2094" }, { "name": "Household_income", "index": "3", "type": "numeric", "distinct": "56", "missing": "0", "min": "42225", "max": "80087", "mean": "55241", "stdev": "8063" }, { "name": "Discretionary_income", "index": "4", "type": "numeric", "distinct": "55", "missing": "0", "min": "34133", "max": "58222", "mean": "44324", "stdev": "5398" }, { "name": "Publics_in_top_10", "index": "5", "type": "nominal", "distinct": "10", "missing": "0", "distr": [ [ "0", "1", "2", "3", "4", "5", "6", "7", "8", "9" ], [ [ "0", "5", "2", "3", "1" ], [ "0", "4", "0", "0", "0" ], [ "1", "2", "2", "0", "0" ], [ "2", "2", "4", "0", "0" ], [ "2", "7", "2", "1", "0" ], [ "1", "4", "2", "0", "0" ], [ "0", "5", "0", "1", "0" ], [ "0", "2", "0", "0", "0" ], [ "0", "1", "0", "0", "0" ], [ "0", "1", "0", "0", "0" ] ] ] }, { "name": "Nonprofits_in_top_10", "index": "6", "type": "nominal", "distinct": "6", "missing": "0", "distr": [ [ "0", "1", "2", "3", "4", "5" ], [ [ "0", "5", "1", "1", "0" ], [ "4", "12", "1", "0", "0" ], [ "2", "11", "3", "1", "0" ], [ "0", "4", "5", "1", "1" ], [ "0", "1", "2", "0", "0" ], [ "0", "0", "0", "2", "0" ] ] ] }, { "name": "For_profits_in_top_10", "index": "7", "type": "nominal", "distinct": "9", "missing": "0", "distr": [ [ "1", "2", "3", "4", "5", "6", "7", "8", "9" ], [ [ "0", "3", "0", "0", "0" ], [ "0", "4", "1", "0", "0" ], [ "0", "5", "4", "1", "0" ], [ "3", "5", "3", "1", "0" ], [ "1", "8", "2", "2", "0" ], [ "1", "0", "0", "0", "0" ], [ "1", "7", "1", "1", "1" ], [ "0", "1", "0", "0", "0" ], [ "0", "0", "1", "0", "0" ] ] ] }, { "name": "Utilities_in_top_10", "index": "8", "type": "nominal", "distinct": "3", "missing": "0", "distr": [ [ "0", "1", "2" ], [ [ "5", "21", "8", "5", "1" ], [ "1", "11", "4", "0", "0" ], [ "0", "1", "0", "0", "0" ] ] ] }, { "name": "Region", "index": "9", "type": "nominal", "distinct": "4", "missing": "0", "distr": [ [ "Midwest", "Northeast", "South", "West" ], [ [ "2", "4", "4", "2", "0" ], [ "0", "4", "4", "3", "1" ], [ "4", "16", "2", "0", "0" ], [ "0", "9", "2", "0", "0" ] ] ] }, { "name": "State_capital", "index": "10", "type": "nominal", "distinct": "2", "missing": "0", "distr": [ [ "No", "Yes" ], [ [ "3", "23", "11", "4", "1" ], [ "3", "10", "1", "1", "0" ] ] ] } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }