{ "data_id": "43377", "name": "Pulsar-Dataset-HTRU2", "exact_name": "Pulsar-Dataset-HTRU2", "version": 1, "version_label": "v1.0", "description": "Description:\nPulsars are a rare type of Neutron star that produce radio emission detectable here on Earth. They are of considerable scientific interest as probes of space-time, the interstellar medium, and states of matter. Machine learning tools are now being used to automatically label pulsar candidates to facilitate rapid analysis. In particular, classification systems are widely adopted, which treat the candidate data sets as binary classification problems.\nAttribute information:\nEach candidate is described by 8 continuous variables and a single class variable. The first four are simple statistics obtained from the integrated pulse profile (folded profile). This is an array of continuous variables that describe a longitude-resolved version of the signal that has been averaged in both time and frequency. The remaining four variables are similarly obtained from the DM-SNR curve. These are summarised below:\n1. Mean of the integrated profile.\n2. Standard deviation of the integrated profile.\n3. Excess kurtosis of the integrated profile.\n4. Skewness of the integrated profile.\n5. Mean of the DM-SNR curve.\n6. Standard deviation of the DM-SNR curve.\n7. Excess kurtosis of the DM-SNR curve.\n8. Skewness of the DM-SNR curve.\n9. Class\n\nDescriptions courtesy of Ustav Murarka:\n\nIntegrated Pulse Profile: Each pulsar produces a unique pattern of pulse emission known as its pulse profile. It is like a fingerprint of the pulsar. It is possible to identify pulsars from their pulse profile alone. But the pulse profile varies slightly in every period. This makes the pulsar hard to detect. This is because their signals are non-uniform and not entirely stable overtime. 
However, these profiles do become stable when averaged over many thousands of rotations.\nDM-SNR Curve: Radio waves emitted from pulsars reach Earth after traveling long distances in space which is filled with free electrons. Since radio waves are electromagnetic in nature, they interact with these electrons, and this interaction results in slowing down of the wave. The important point is that pulsars emit a wide range of frequencies, and the amount by which the electrons slow down the wave depends on the frequency. Waves with higher frequency are slowed down less as compared to waves with lower frequency, i.e. lower frequencies reach the telescope later than higher frequencies. This is called dispersion.\nDataset Summary:\n17,898 total examples.\n1,639 positive examples.\n16,259 negative examples.\n\nExample\nExample from Prof. Anna Scaife at the University of Manchester, UK- https:\/\/as595.github.io\/classification\/\nSource: (https:\/\/archive.ics.uci.edu\/ml\/datasets\/HTRU2)\nDr. Robert Lyon\nUniversity of Manchester\nSchool of Physics and Astronomy\nAlan Turing Building\nManchester M13 9PL\nUnited Kingdom\nrobert.lyon '' manchester.ac.uk\n\n-", "format": "arff", "uploader": "Elif Ceren Gok", "uploader_id": 30125, "visibility": "public", "creator": null, "contributor": null, "date": "2022-03-23 12:44:09", "update_comment": null, "last_update": "2022-03-23 12:44:09", "licence": "CC BY-NC-SA 4.0", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/22102202\/dataset", "default_target_attribute": null, "row_id_attribute": null, "ignore_attribute": null, "runs": 0, "suggest": { "input": [ "Pulsar-Dataset-HTRU2", "Description: Pulsars are a rare type of Neutron star that produce radio emission detectable here on Earth. They are of considerable scientific interest as probes of space-time, the interstellar medium, and states of matter. 
Machine learning tools are now being used to automatically label pulsar candidates to facilitate rapid analysis. In particular, classification systems are widely adopted, which treat the candidate data sets as binary classification problems. Attribute information: Each candid " ], "weight": 5 }, "qualities": { "NumberOfInstances": 17897, "NumberOfFeatures": 9, "NumberOfClasses": null, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 9, "NumberOfSymbolicFeatures": 0, "Dimensionality": 0.0005028775772475834, "PercentageOfNumericFeatures": 100, "MajorityClassPercentage": null, "PercentageOfSymbolicFeatures": 0, "MajorityClassSize": null, "MinorityClassPercentage": null, "MinorityClassSize": null, "NumberOfBinaryFeatures": 0, "PercentageOfBinaryFeatures": 0, "PercentageOfInstancesWithMissingValues": 0, "AutoCorrelation": null, "PercentageOfMissingValues": 0 }, "tags": [ { "uploader": "38960", "tag": "Machine Learning" }, { "uploader": "38960", "tag": "Manufacturing" } ], "features": [ { "name": "140.5625", "index": "0", "type": "numeric", "distinct": "8625", "missing": "0", "min": "6", "max": "193", "mean": "111", "stdev": "26" }, { "name": "55.68378214", "index": "1", "type": "numeric", "distinct": "17861", "missing": "0", "min": "25", "max": "99", "mean": "47", "stdev": "7" }, { "name": "-0.234571412", "index": "2", "type": "numeric", "distinct": "17896", "missing": "0", "min": "-2", "max": "8", "mean": "0", "stdev": "1" }, { "name": "-0.699648398", "index": "3", "type": "numeric", "distinct": "17897", "missing": "0", "min": "-2", "max": "68", "mean": "2", "stdev": "6" }, { "name": "3.199832776", "index": "4", "type": "numeric", "distinct": "9000", "missing": "0", "min": "0", "max": "223", "mean": "13", "stdev": "29" }, { "name": "19.11042633", "index": "5", "type": "numeric", "distinct": "17893", "missing": "0", "min": "7", "max": "111", "mean": "26", "stdev": "19" }, { "name": "7.975531794", "index": "6", "type": 
"numeric", "distinct": "17894", "missing": "0", "min": "-3", "max": "35", "mean": "8", "stdev": "5" }, { "name": "74.24222492", "index": "7", "type": "numeric", "distinct": "17894", "missing": "0", "min": "-2", "max": "1191", "mean": "105", "stdev": "107" }, { "name": "0", "index": "8", "type": "numeric", "distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "0", "stdev": "0" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }