{ "data_id": "40900", "name": "Satellite", "exact_name": "Satellite", "version": 1, "version_label": null, "description": "**Author**: Markus Goldstein \r\n**Source**: [Dataverse](http:\/\/www.madm.eu\/downloads https:\/\/dataverse.harvard.edu\/dataset.xhtml?persistentId=doi:10.7910\/DVN\/OPQMVF) \r\n**Please cite**: \r\n\r\nThe satellite dataset comprises features extracted from satellite observations. In particular, each image was taken under four different light wavelengths, two in visible light (green and red) and two infrared images. The task of the original dataset is to classify the image into the soil category of the observed region. \r\n\r\n### Classes\r\nWe defined the soil classes “red soil”, “gray soil”, “damp gray soil” and “very damp gray soil” as the normal class. From the semantically different classes “cotton crop” and “soil with vegetation stubble” anomalies are sampled. \r\n\r\nAfter merging the original training and test set into a single dataset, the resulting dataset contains 5,025 normal instances as well as 75 randomly sampled anomalies (1.49%) with 36 dimensions \r\n\r\n### Relevant Papers\r\n\r\nGoldstein, Markus, and Seiichi Uchida. \"A comparative evaluation of unsupervised anomaly detection algorithms for multivariate data.\" PloS one 11.4 (2016): e0152173 \r\n\r\nThis dataset is not the original dataset. The target variable 'Target' is relabeled into 'Normal' and 'Anomaly'", 
"format": "ARFF", "uploader": "Minh-Anh Le", "uploader_id": 3768, "visibility": "public", "creator": "\"Markus Goldstein\"", "contributor": null, "date": "2017-09-22 17:23:34", "update_comment": null, "last_update": "2017-09-22 17:23:34", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/16787463\/phpZrCzJR", "default_target_attribute": "Target", "row_id_attribute": null, "ignore_attribute": null, "runs": 2078, "suggest": { "input": [ "Satellite", "The satellite dataset comprises features extracted from satellite observations. In particular, each image was taken under four different light wavelengths, two in visible light (green and red) and two infrared images. The task of the original dataset is to classify the image into the soil category of the observed region. ### Classes We defined the soil classes “red soil”, “gray soil”, “damp gray soil” and “very damp gray soil” as the normal class " ], "weight": 5 }, "qualities": { "NumberOfInstances": 5100, "NumberOfFeatures": 37, "NumberOfClasses": 2, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 36, "NumberOfSymbolicFeatures": 1, "MinSkewnessOfNumericAtts": -0.4083627845537765, "PercentageOfSymbolicFeatures": 2.7027027027027026, "Quartile3MutualInformation": null, "MaxNominalAttDistinctValues": 2, "MinStdDevOfNumericAtts": 11.658746554511957, "Quartile1AttributeEntropy": null, "Quartile3SkewnessOfNumericAtts": 0.06649700827757384, "MaxSkewnessOfNumericAtts": 0.12114448900529776, "MinorityClassPercentage": 1.4705882352941175, "Quartile1KurtosisOfNumericAtts": -0.8833972649132604, "Quartile3StdDevOfNumericAtts": 15.731707267105959, "MaxStdDevOfNumericAtts": 16.218497602623724, "MinorityClassSize": 75, "Quartile1MeansOfNumericAtts": 74.66279411764697, "StdvNominalAttDistinctValues": 0, "MeanAttributeEntropy": null, 
"NumberOfBinaryFeatures": 1, "Quartile1MutualInformation": null, "MeanKurtosisOfNumericAtts": -0.4632046647796124, "Quartile1SkewnessOfNumericAtts": -0.3001765419655136, "MeanMeansOfNumericAtts": 85.71349128540305, "Quartile1StdDevOfNumericAtts": 12.346102059986409, "AutoCorrelation": 0.9998038831143361, "MeanMutualInformation": null, "MeanNoiseToSignalRatio": null, "Quartile2AttributeEntropy": null, "ClassEntropy": 0.11058084476988708, "MeanNominalAttDistinctValues": 2, "Quartile2KurtosisOfNumericAtts": -0.44361356574449506, "Dimensionality": 0.0072549019607843135, "MeanSkewnessOfNumericAtts": -0.1096173151401041, "Quartile2MeansOfNumericAtts": 85.34186274509807, "EquivalentNumberOfAtts": null, "MeanStdDevOfNumericAtts": 14.241442633248703, "Quartile2MutualInformation": null, "MajorityClassPercentage": 98.52941176470588, "MinAttributeEntropy": null, "Quartile2SkewnessOfNumericAtts": -0.09325273490947447, "MajorityClassSize": 5025, "MinKurtosisOfNumericAtts": -1.0003040613442957, "PercentageOfBinaryFeatures": 2.7027027027027026, "Quartile2StdDevOfNumericAtts": 14.657614038348763, "MaxAttributeEntropy": null, "MinMeansOfNumericAtts": 72.35764705882367, "PercentageOfInstancesWithMissingValues": 0, "Quartile3AttributeEntropy": null, "MaxKurtosisOfNumericAtts": 0.08103471866179213, "MinMutualInformation": null, "PercentageOfMissingValues": 0, "Quartile3KurtosisOfNumericAtts": -0.0932955601099793, "MaxMeansOfNumericAtts": 99.56862745098042, "MinNominalAttDistinctValues": 2, "PercentageOfNumericFeatures": 97.2972972972973, "Quartile3MeansOfNumericAtts": 97.14073529411766, "MaxMutualInformation": null }, "tags": [ { "tag": "Life Science", "uploader": "38960" }, { "tag": "Medicine", "uploader": "38960" }, { "tag": "study_293", "uploader": "0" }, { "tag": "study_270", "uploader": "0" }, { "tag": "study_271", "uploader": "0" } ], "features": [ { "name": "Target", "index": "36", "type": "nominal", "distinct": "2", "missing": "0", "target": "1", "distr": [ [ "Normal", 
"Anomaly" ], [ [ "5025", "0" ], [ "0", "75" ] ] ] }, { "name": "V1", "index": "0", "type": "numeric", "distinct": "49", "missing": "0", "min": "41", "max": "104", "mean": "73", "stdev": "12" }, { "name": "V2", "index": "1", "type": "numeric", "distinct": "81", "missing": "0", "min": "28", "max": "137", "mean": "92", "stdev": "16" }, { "name": "V3", "index": "2", "type": "numeric", "distinct": "69", "missing": "0", "min": "62", "max": "139", "mean": "100", "stdev": "16" }, { "name": "V4", "index": "3", "type": "numeric", "distinct": "78", "missing": "0", "min": "44", "max": "144", "mean": "80", "stdev": "14" }, { "name": "V5", "index": "4", "type": "numeric", "distinct": "48", "missing": "0", "min": "42", "max": "104", "mean": "73", "stdev": "12" }, { "name": "V6", "index": "5", "type": "numeric", "distinct": "76", "missing": "0", "min": "29", "max": "137", "mean": "91", "stdev": "16" }, { "name": "V7", "index": "6", "type": "numeric", "distinct": "68", "missing": "0", "min": "62", "max": "139", "mean": "99", "stdev": "16" }, { "name": "V8", "index": "7", "type": "numeric", "distinct": "76", "missing": "0", "min": "46", "max": "157", "mean": "80", "stdev": "13" }, { "name": "V9", "index": "8", "type": "numeric", "distinct": "47", "missing": "0", "min": "42", "max": "104", "mean": "73", "stdev": "12" }, { "name": "V10", "index": "9", "type": "numeric", "distinct": "77", "missing": "0", "min": "29", "max": "130", "mean": "91", "stdev": "16" }, { "name": "V11", "index": "10", "type": "numeric", "distinct": "69", "missing": "0", "min": "60", "max": "140", "mean": "99", "stdev": "16" }, { "name": "V12", "index": "11", "type": "numeric", "distinct": "81", "missing": "0", "min": "34", "max": "150", "mean": "79", "stdev": "14" }, { "name": "V13", "index": "12", "type": "numeric", "distinct": "49", "missing": "0", "min": "41", "max": "104", "mean": "73", "stdev": "12" }, { "name": "V14", "index": "13", "type": "numeric", "distinct": "77", "missing": "0", "min": "27", "max": 
"137", "mean": "92", "stdev": "16" }, { "name": "V15", "index": "14", "type": "numeric", "distinct": "67", "missing": "0", "min": "62", "max": "139", "mean": "99", "stdev": "16" }, { "name": "V16", "index": "15", "type": "numeric", "distinct": "73", "missing": "0", "min": "44", "max": "150", "mean": "80", "stdev": "14" }, { "name": "V17", "index": "16", "type": "numeric", "distinct": "49", "missing": "0", "min": "41", "max": "104", "mean": "73", "stdev": "12" }, { "name": "V18", "index": "17", "type": "numeric", "distinct": "72", "missing": "0", "min": "27", "max": "130", "mean": "92", "stdev": "16" }, { "name": "V19", "index": "18", "type": "numeric", "distinct": "67", "missing": "0", "min": "62", "max": "139", "mean": "99", "stdev": "16" }, { "name": "V20", "index": "19", "type": "numeric", "distinct": "75", "missing": "0", "min": "44", "max": "146", "mean": "80", "stdev": "14" }, { "name": "V21", "index": "20", "type": "numeric", "distinct": "47", "missing": "0", "min": "42", "max": "104", "mean": "73", "stdev": "12" }, { "name": "V22", "index": "21", "type": "numeric", "distinct": "73", "missing": "0", "min": "29", "max": "130", "mean": "91", "stdev": "16" }, { "name": "V23", "index": "22", "type": "numeric", "distinct": "69", "missing": "0", "min": "60", "max": "138", "mean": "99", "stdev": "16" }, { "name": "V24", "index": "23", "type": "numeric", "distinct": "84", "missing": "0", "min": "34", "max": "150", "mean": "79", "stdev": "14" }, { "name": "V25", "index": "24", "type": "numeric", "distinct": "49", "missing": "0", "min": "40", "max": "104", "mean": "73", "stdev": "12" }, { "name": "V26", "index": "25", "type": "numeric", "distinct": "78", "missing": "0", "min": "27", "max": "131", "mean": "91", "stdev": "16" }, { "name": "V27", "index": "26", "type": "numeric", "distinct": "69", "missing": "0", "min": "60", "max": "139", "mean": "99", "stdev": "16" }, { "name": "V28", "index": "27", "type": "numeric", "distinct": "78", "missing": "0", "min": "44", 
"max": "151", "mean": "80", "stdev": "14" }, { "name": "V29", "index": "28", "type": "numeric", "distinct": "48", "missing": "0", "min": "41", "max": "104", "mean": "73", "stdev": "12" }, { "name": "V30", "index": "29", "type": "numeric", "distinct": "78", "missing": "0", "min": "27", "max": "130", "mean": "91", "stdev": "16" }, { "name": "V31", "index": "30", "type": "numeric", "distinct": "68", "missing": "0", "min": "62", "max": "139", "mean": "99", "stdev": "16" }, { "name": "V32", "index": "31", "type": "numeric", "distinct": "78", "missing": "0", "min": "42", "max": "151", "mean": "80", "stdev": "14" }, { "name": "V33", "index": "32", "type": "numeric", "distinct": "49", "missing": "0", "min": "40", "max": "104", "mean": "72", "stdev": "12" }, { "name": "V34", "index": "33", "type": "numeric", "distinct": "76", "missing": "0", "min": "27", "max": "130", "mean": "91", "stdev": "16" }, { "name": "V35", "index": "34", "type": "numeric", "distinct": "70", "missing": "0", "min": "50", "max": "138", "mean": "99", "stdev": "16" }, { "name": "V36", "index": "35", "type": "numeric", "distinct": "80", "missing": "0", "min": "29", "max": "147", "mean": "79", "stdev": "14" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 3, "nr_of_downloads": 70, "total_downloads": 133, "reach": 73, "reuse": 16, "impact_of_reuse": 0, "reach_of_reuse": 37, "impact": 34 }