{ "data_id": "673", "name": "chscase_census2", "exact_name": "chscase_census2", "version": 1, "version_label": null, "description": "**Author**: \n**Source**: Unknown - Date unknown \n**Please cite**: \n\nFile README\n-----------\n\nchscase A collection of the data sets used in the book\n\"A Casebook for a First Course in Statistics and Data Analysis,\"\nby Samprit Chatterjee, Mark S. Handcock and Jeffrey S. Simonoff,\nJohn Wiley and Sons, New York, 1995. Submitted by\nSamprit Chatterjee (schatterjee@stern.nyu.edu),\nMark Handcock (mhandcock@stern.nyu.edu) and\nJeff Simonoff (jsimonoff@stern.nyu.edu)\n\nThis submission consists of 38 files, plus this README file.\nEach file represents a data set analyzed in the book. The names\nof the files correspond to the names used in the book. The data\nfiles are written in plain ASCII (character) text. Missing\nvalues are represented by \"M\" in all data files.\n\nMore information about the data sets and the book can be\nobtained via gopher at the address\nswis.stern.nyu.edu\n\nThe information is filed under\n---> Academic Departments & Research Centers\n---> Statistics and Operations Research\n---> Publications\n---> A Casebook for a First Course in Statistics and Data Analysis\n---> Welcome!\n\nIt can also be accessed from the World Wide Web (WWW) using a\nWWW browser (e.g., netscape) starting from the URL address\nhttp:\/\/www.stern.nyu.edu\/SOR\/Casebook\n\n\n\nNOTICE: These datasets may be used freely for scientific,\neducational and\/or non-commercial purposes, provided suitable\nacknowledgment is given (by citing the Chatterjee, Handcock and\nSimonoff reference above).\n\nFile: census2.dat\n\nNote: attribute names were generated automatically since there was no\ninformation in the data itself.\n\n\nInformation about the dataset\nCLASSTYPE: numeric\nCLASSINDEX: none specific", "format": "ARFF", "uploader": "Joaquin Vanschoren", "uploader_id": 2, "visibility": "public", "creator": "Samprit Chatterjee, Mark S. Handcock, Jeffrey S. Simonoff", "contributor": null, "date": "2014-10-04 13:54:06", "update_comment": "fixed arff file (missing value characters)", "last_update": "2015-04-15 22:17:36", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/1390073\/phpaGFJfu", "kaggle_url": null, "default_target_attribute": "col_8", "row_id_attribute": null, "ignore_attribute": null, "runs": 22, "suggest": { "input": [ "chscase_census2", "File README ----------- chscase A collection of the data sets used in the book \"A Casebook for a First Course in Statistics and Data Analysis,\" by Samprit Chatterjee, Mark S. Handcock and Jeffrey S. Simonoff, John Wiley and Sons, New York, 1995. Submitted by Samprit Chatterjee (schatterjee@stern.nyu.edu), Mark Handcock (mhandcock@stern.nyu.edu) and Jeff Simonoff (jsimonoff@stern.nyu.edu) This submission consists of 38 files, plus this README file. Each file represents a data set analyzed in the " ], "weight": 5 }, "qualities": { "NumberOfInstances": 400, "NumberOfFeatures": 8, "NumberOfClasses": 0, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 8, "NumberOfSymbolicFeatures": 0, "MaxMutualInformation": null, "MinNominalAttDistinctValues": null, "PercentageOfBinaryFeatures": 0, "Quartile2StdDevOfNumericAtts": 3.27296640071453, "RandomTreeDepth1AUC": null, "Dimensionality": 0.02, "MaxNominalAttDistinctValues": null, "MinSkewnessOfNumericAtts": 0.10175154033937105, "PercentageOfInstancesWithMissingValues": 0, "Quartile3AttributeEntropy": null, "RandomTreeDepth1ErrRate": null, "EquivalentNumberOfAtts": null, "MaxSkewnessOfNumericAtts": 2.68073920034646, "MinStdDevOfNumericAtts": 0.5035223014874697, "PercentageOfMissingValues": 0, "Quartile3KurtosisOfNumericAtts": 8.535801452534248, "AutoCorrelation": 0.43266716791979976, "RandomTreeDepth1Kappa": null, "J48.00001.AUC": null, "MaxStdDevOfNumericAtts": 12.92188785565907, "MinorityClassPercentage": null, "PercentageOfNumericFeatures": 100, "Quartile3MeansOfNumericAtts": 20.2421865625, "CfsSubsetEval_DecisionStumpAUC": null, "RandomTreeDepth2AUC": null, "J48.00001.ErrRate": null, "MeanAttributeEntropy": null, "MinorityClassSize": null, "PercentageOfSymbolicFeatures": 0, "Quartile3MutualInformation": null, "CfsSubsetEval_DecisionStumpErrRate": null, "RandomTreeDepth2ErrRate": null, "J48.00001.Kappa": null, "MeanKurtosisOfNumericAtts": 4.023913191627579, "NaiveBayesAUC": null, "Quartile1AttributeEntropy": null, "Quartile3SkewnessOfNumericAtts": 2.043147869405944, "CfsSubsetEval_DecisionStumpKappa": null, "RandomTreeDepth2Kappa": null, "J48.0001.AUC": null, "MeanMeansOfNumericAtts": 19.96079809375, "NaiveBayesErrRate": null, "Quartile1KurtosisOfNumericAtts": 0.5104441233804474, "Quartile3StdDevOfNumericAtts": 8.011812882967877, "CfsSubsetEval_NaiveBayesAUC": null, "RandomTreeDepth3AUC": null, "J48.0001.ErrRate": null, "MeanMutualInformation": null, "NaiveBayesKappa": null, "Quartile1MeansOfNumericAtts": 19.7683659375, "REPTreeDepth1AUC": null, "CfsSubsetEval_NaiveBayesErrRate": null, "RandomTreeDepth3ErrRate": null, "J48.0001.Kappa": null, "MeanNoiseToSignalRatio": null, "NumberOfBinaryFeatures": 0, "Quartile1MutualInformation": null, "REPTreeDepth1ErrRate": null, "CfsSubsetEval_NaiveBayesKappa": null, "RandomTreeDepth3Kappa": null, "J48.001.AUC": null, "MeanNominalAttDistinctValues": null, "Quartile1SkewnessOfNumericAtts": 0.49955676313552755, "REPTreeDepth1Kappa": null, "CfsSubsetEval_kNN1NAUC": null, "StdvNominalAttDistinctValues": null, "J48.001.ErrRate": null, "J48.001.Kappa": null, "MeanSkewnessOfNumericAtts": 1.1667261920200749, "Quartile1StdDevOfNumericAtts": 1.3073960733088805, "REPTreeDepth2AUC": null, "CfsSubsetEval_kNN1NErrRate": null, "kNN1NAUC": null, "MajorityClassPercentage": null, "MeanStdDevOfNumericAtts": 4.635876644060639, "Quartile2AttributeEntropy": null, "REPTreeDepth2ErrRate": null, "CfsSubsetEval_kNN1NKappa": null, "kNN1NErrRate": null, "MajorityClassSize": null, "MinAttributeEntropy": null, "Quartile2KurtosisOfNumericAtts": 0.9580534837892727, "REPTreeDepth2Kappa": null, "ClassEntropy": null, "kNN1NKappa": null, "MaxAttributeEntropy": null, "MinKurtosisOfNumericAtts": 0.22678912420903918, "Quartile2MeansOfNumericAtts": 19.86353975, "REPTreeDepth3AUC": null, "DecisionStumpAUC": null, "MaxKurtosisOfNumericAtts": 12.822428414662593, "MinMeansOfNumericAtts": 19.39201725, "Quartile2MutualInformation": null, "REPTreeDepth3ErrRate": null, "DecisionStumpErrRate": null, "MaxMeansOfNumericAtts": 20.7305125, "MinMutualInformation": null, "Quartile2SkewnessOfNumericAtts": 0.7451018651105756, "REPTreeDepth3Kappa": null, "DecisionStumpKappa": null }, "tags": [ { "uploader": "38960", "tag": "Data Science" }, { "uploader": "38960", "tag": "Education" }, { "uploader": "24659", "tag": "StatLib" } ], "topics": [ { "topic": "Book-based", "uploader": "8111" } ], "features": [ { "name": "col_8", "index": "7", "type": "numeric", "distinct": "397", "missing": "0", "target": "1", "min": "18", "max": "22", "mean": "20", "stdev": "1" }, { "name": "col_1", "index": "0", "type": "numeric", "distinct": "379", "missing": "0", "min": "0", "max": "115", "mean": "21", "stdev": "13" }, { "name": "col_2", "index": "1", "type": "numeric", "distinct": "397", "missing": "0", "min": "7", "max": "78", "mean": "20", "stdev": "9" }, { "name": "col_3", "index": "2", "type": "numeric", "distinct": "398", "missing": "0", "min": "8", "max": "41", "mean": "19", "stdev": "5" }, { "name": "col_4", "index": "3", "type": "numeric", "distinct": "399", "missing": "0", "min": "12", "max": "47", "mean": "20", "stdev": "4" }, { "name": "col_5", "index": "4", "type": "numeric", "distinct": "398", "missing": "0", "min": "14", "max": "27", "mean": "20", "stdev": "2" }, { "name": "col_6", "index": "5", "type": "numeric", "distinct": "400", "missing": "0", "min": "16", "max": "26", "mean": "20", "stdev": "2" }, { "name": "col_7", "index": "6", "type": "numeric", "distinct": "397", "missing": "0", "min": "17", "max": "24", "mean": "20", "stdev": "1" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }