{ "data_id": "46251", "name": "Solar-Power", "exact_name": "Solar-Power", "version": 1, "version_label": null, "description": "Solar power production in MW recorded per every 4 seconds starting from 01\/08\/2019 in Australia.\n\nFrom the website:\n-----\nThis dataset contains a single very long daily time series representing the solar power production in MW recorded per every 4 seconds starting from 01\/08\/2019. It was downloaded from the Australian Energy Market Operator (AEMO) online platform. The length of this time series is 7397222.\n\n-----\n\nHere is the dataset curated by the Monash Time Series Forecasting Repository. It is not clear which were the preprocessing steps and how they\nacquired the data from the original website (https:\/\/aemo.com.au\/ and http:\/\/www.nemweb.com.au\/).\n\nThere are 4 columns:\n\nid_series: The id of the time series.\n\ndate: The date of the time series in the format \"%Y-%m-%d\".\n\ntime_step: The time step on the time series.\n\nvalue_0: The values of the time series, which will be used for the forecasting task.\n\nPreprocessing:\n\n1 - Renamed columns 'series_name' and 'series_value' to 'id_series' and 'value_0'.\n\n2 - Exploded the 'value' column.\n\n3 - Created 'time_step' column from the exploded data.\n\n4 - Created 'date' column from the 'start_timestamp' and 'time_step' column, by offsetting the 'start_timestamp' by 4 seconds * time_step.\n\n5 - Dropped 'start_timestamp' column. 
Defined 'id_series' as 'category' and casted 'value_0' to float.", "format": "arff", "uploader": "Bruno Belucci Teixeira", "uploader_id": 30703, "visibility": "public", "creator": "\"Godahewa, Rakshitha; Bergmeir, Christoph; Webb, Geoff; Abolghasemi, Mahdi; Hyndman, Rob; Montero-Manso, Pablo\"", "contributor": null, "date": "2024-06-25 01:03:00", "update_comment": null, "last_update": "2024-06-25 01:03:00", "licence": "Creative Commons Attribution 4.0 International", "status": "active", "error_message": null, "url": "https:\/\/api.openml.org\/data\/download\/22120715\/dataset", "default_target_attribute": null, "row_id_attribute": null, "ignore_attribute": null, "runs": 0, "suggest": { "input": [ "Solar-Power", "Solar power production in MW recorded per every 4 seconds starting from 01\/08\/2019 in Australia. From the website: ----- This dataset contains a single very long daily time series representing the solar power production in MW recorded per every 4 seconds starting from 01\/08\/2019. It was downloaded from the Australian Energy Market Operator (AEMO) online platform. The length of this time series is 7397222. ----- Here is the dataset curated by the Monash Time Series Forecasting Repository. 
It is n " ], "weight": 5 }, "qualities": { "NumberOfInstances": 7397222, "NumberOfFeatures": 4, "NumberOfClasses": null, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 2, "NumberOfSymbolicFeatures": 1, "PercentageOfBinaryFeatures": 0, "PercentageOfInstancesWithMissingValues": 0, "PercentageOfMissingValues": 0, "AutoCorrelation": null, "PercentageOfNumericFeatures": 50, "Dimensionality": 5.407435385878645e-7, "PercentageOfSymbolicFeatures": 25, "MajorityClassPercentage": null, "MajorityClassSize": null, "MinorityClassPercentage": null, "MinorityClassSize": null, "NumberOfBinaryFeatures": 0 }, "tags": [], "features": [ { "name": "id_series", "index": "0", "type": "nominal", "distinct": "1", "missing": "0", "distr": [] }, { "name": "value_0", "index": "1", "type": "numeric", "distinct": "1147", "missing": "0", "min": "0", "max": "117", "mean": "33", "stdev": "43" }, { "name": "time_step", "index": "2", "type": "numeric", "distinct": "7397222", "missing": "0", "min": "0", "max": "7397221", "mean": "3698611", "stdev": "2135394" }, { "name": "date", "index": "3", "type": "string", "distinct": "7397222", "missing": "0" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }