{ "data_id": "354", "name": "poker", "exact_name": "poker", "version": 1, "version_label": null, "description": "**Author**: UCI \n**Source**: [original](http:\/\/www.csie.ntu.edu.tw\/~cjlin\/libsvmtools\/datasets) - \n**Please cite**: \n\nThis is the poker dataset, retrieved 2013-11-14 from the libSVM site. Additional to the preprocessing done there (see LibSVM site for details), this dataset was created as follows: \n\n-join test and train datasets (non-scaled versions) \n-relabel classes 0=positive class and 1,2,...9=negative class \n-normalize each file columnwise according to the following rules: \n-If a column only contains one value (constant feature), it will set to zero and thus removed by sparsity. \n-If a column contains two values (binary feature), the value occuring more often will be set to zero, the other to one. \n-If a column contains more than two values (multinary\/real feature), the column is divided by its std deviation. \n\nNOTE: please keep in mind that poker has a mild redundancy, e.g. some duplicated data points, roughly 0.2%, within each file (train,test). these duplicated points have not been removed!\n", "format": "Sparse_ARFF", "uploader": "aydin demircioglu", "uploader_id": 167, "visibility": "public", "creator": "\"UCI\"", "contributor": null, "date": "2014-08-29 19:20:49", "update_comment": null, "last_update": "2014-08-29 19:20:49", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/52257\/phpQfR7GF", "default_target_attribute": "Y", "row_id_attribute": null, "ignore_attribute": null, "runs": 23, "suggest": { "input": [ "poker", "This is the poker dataset, retrieved 2013-11-14 from the libSVM site. Additional to the preprocessing done there (see LibSVM site for details), this dataset was created as follows: -join test and train datasets (non-scaled versions) -relabel classes 0=positive class and 1,2,...9=negative class -normalize each file columnwise according to the following rules: -If a column only contains one value (constant feature), it will set to zero and thus removed by sparsity. -If a column contains two values " ], "weight": 5 }, "qualities": { "NumberOfInstances": 1025010, "NumberOfFeatures": 11, "NumberOfClasses": 2, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 10, "NumberOfSymbolicFeatures": 1, "Quartile2KurtosisOfNumericAtts": -1.2869179105888708, "REPTreeDepth2Kappa": 0.44457831635167633, "ClassEntropy": 0.999996065069868, "kNN1NKappa": 0.15110985818195694, "MajorityClassSize": 513702, "MinAttributeEntropy": null, "Quartile2MeansOfNumericAtts": 2.0525138589969862, "REPTreeDepth3AUC": 0.7921387830234807, "DecisionStumpAUC": 0.501351392863736, "MaxAttributeEntropy": null, "MinKurtosisOfNumericAtts": -1.3620784913025086, "Quartile2MutualInformation": null, "REPTreeDepth3ErrRate": 0.2776382669437371, "DecisionStumpErrRate": 0.49893659574052934, "MaxKurtosisOfNumericAtts": -1.2139443053241539, "MinMeansOfNumericAtts": 1.8687027823168558, "Quartile2SkewnessOfNumericAtts": -0.0004426365875057511, "REPTreeDepth3Kappa": 0.44457831635167633, "DecisionStumpKappa": 0.0014085134775763887, "MaxMeansOfNumericAtts": 2.237961613767665, "MinMutualInformation": null, "PercentageOfBinaryFeatures": 9.090909090909092, "Quartile2StdDevOfNumericAtts": 0.9999999978451746, "RandomTreeDepth1AUC": 0.675690658008867, "Dimensionality": 1.0731602618511039e-5, "MaxMutualInformation": null, "MinNominalAttDistinctValues": 2, "PercentageOfInstancesWithMissingValues": 0, "Quartile3AttributeEntropy": null, "RandomTreeDepth1ErrRate": 0.32431195793211776, "EquivalentNumberOfAtts": null, "MaxNominalAttDistinctValues": 2, "MinSkewnessOfNumericAtts": -0.0023343750671693743, "PercentageOfMissingValues": 0, "Quartile3KurtosisOfNumericAtts": -1.214133977037437, "AutoCorrelation": 0.4999243909077872, "RandomTreeDepth1Kappa": 0.35137778673423214, "J48.00001.AUC": 0.8256239656337289, "MaxSkewnessOfNumericAtts": 0.003976438996103179, "MinStdDevOfNumericAtts": 0.9999998332766981, "PercentageOfNumericFeatures": 90.9090909090909, "Quartile3MeansOfNumericAtts": 2.2366421272185173, "CfsSubsetEval_DecisionStumpAUC": 0.5, "RandomTreeDepth2AUC": 0.675690658008867, "J48.00001.ErrRate": 0.23210993063482308, "MaxStdDevOfNumericAtts": 1.000000059360445, "MinorityClassPercentage": 49.88322065150584, "PercentageOfSymbolicFeatures": 9.090909090909092, "Quartile3MutualInformation": null, "CfsSubsetEval_DecisionStumpErrRate": 0.4988322065150584, "RandomTreeDepth2ErrRate": 0.32431195793211776, "J48.00001.Kappa": 0.5356154784837265, "MeanAttributeEntropy": null, "MinorityClassSize": 511308, "Quartile1AttributeEntropy": null, "Quartile3SkewnessOfNumericAtts": 0.00036009808207030454, "CfsSubsetEval_DecisionStumpKappa": 0, "RandomTreeDepth2Kappa": 0.35137778673423214, "J48.0001.AUC": 0.8256239656337289, "MeanKurtosisOfNumericAtts": -1.287483723946719, "NaiveBayesAUC": 0.5055055063242602, "Quartile1KurtosisOfNumericAtts": -1.3608804059534425, "Quartile3StdDevOfNumericAtts": 1.0000000337491475, "CfsSubsetEval_NaiveBayesAUC": 0.5, "RandomTreeDepth3AUC": 0.675690658008867, "J48.0001.ErrRate": 0.23210993063482308, "MeanMeansOfNumericAtts": 2.0531072186889205, "NaiveBayesErrRate": 0.49009960878430453, "Quartile1MeansOfNumericAtts": 1.8701857898038323, "REPTreeDepth1AUC": 0.7921387830234807, "CfsSubsetEval_NaiveBayesErrRate": 0.4988322065150584, "RandomTreeDepth3ErrRate": 0.32431195793211776, "J48.0001.Kappa": 0.5356154784837265, "MeanMutualInformation": null, "NaiveBayesKappa": 0.0191603021069954, "Quartile1MutualInformation": null, "REPTreeDepth1ErrRate": 0.2776382669437371, "CfsSubsetEval_NaiveBayesKappa": 0, "RandomTreeDepth3Kappa": 0.35137778673423214, "J48.001.AUC": 0.8256239656337289, "MeanNoiseToSignalRatio": null, "NumberOfBinaryFeatures": 1, "Quartile1SkewnessOfNumericAtts": -0.0017526464580151736, "REPTreeDepth1Kappa": 0.44457831635167633, "CfsSubsetEval_kNN1NAUC": 0.5, "StdvNominalAttDistinctValues": 0, "J48.001.ErrRate": 0.23210993063482308, "MeanNominalAttDistinctValues": 2, "Quartile1StdDevOfNumericAtts": 0.9999998878001628, "REPTreeDepth2AUC": 0.7921387830234807, "CfsSubsetEval_kNN1NErrRate": 0.4988322065150584, "kNN1NAUC": 0.5755774139921012, "J48.001.Kappa": 0.5356154784837265, "MeanSkewnessOfNumericAtts": -0.0002357688070950237, "Quartile2AttributeEntropy": null, "REPTreeDepth2ErrRate": 0.2776382669437371, "CfsSubsetEval_kNN1NKappa": 0, "kNN1NErrRate": 0.4244446395644921, "MajorityClassPercentage": 50.116779348494155, "MeanStdDevOfNumericAtts": 0.9999999633279619 }, "tags": [ { "uploader": "38960", "tag": "Machine Learning" } ], "features": [ { "name": "Y", "index": "0", "type": "nominal", "distinct": "2", "missing": "0", "target": "1", "distr": [ [ "1", "-1" ], [ [ "513702", "0" ], [ "0", "511308" ] ] ] }, { "name": "X1", "index": "1", "type": "numeric", "distinct": "4", "missing": "0", "min": "1", "max": "4", "mean": "2", "stdev": "1" }, { "name": "X2", "index": "2", "type": "numeric", "distinct": "13", "missing": "0", "min": "0", "max": "3", "mean": "2", "stdev": "1" }, { "name": "X3", "index": "3", "type": "numeric", "distinct": "4", "missing": "0", "min": "1", "max": "4", "mean": "2", "stdev": "1" }, { "name": "X4", "index": "4", "type": "numeric", "distinct": "13", "missing": "0", "min": "0", "max": "3", "mean": "2", "stdev": "1" }, { "name": "X5", "index": "5", "type": "numeric", "distinct": "4", "missing": "0", "min": "1", "max": "4", "mean": "2", "stdev": "1" }, { "name": "X6", "index": "6", "type": "numeric", "distinct": "13", "missing": "0", "min": "0", "max": "3", "mean": "2", "stdev": "1" }, { "name": "X7", "index": "7", "type": "numeric", "distinct": "4", "missing": "0", "min": "1", "max": "4", "mean": "2", "stdev": "1" }, { "name": "X8", "index": "8", "type": "numeric", "distinct": "13", "missing": "0", "min": "0", "max": "3", "mean": "2", "stdev": "1" }, { "name": "X9", "index": "9", "type": "numeric", "distinct": "4", "missing": "0", "min": "1", "max": "4", "mean": "2", "stdev": "1" }, { "name": "X10", "index": "10", "type": "numeric", "distinct": "13", "missing": "0", "min": "0", "max": "3", "mean": "2", "stdev": "1" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }