{ "data_id": "1168", "name": "electricity_prices_ICON", "exact_name": "electricity_prices_ICON", "version": 1, "version_label": null, "description": "**Author**: H. Simonis, B. O\u2019Sullivan, D. Mehta, B. Hurley, M. De Cauwer \n**Source**: [ICON Challenge](http:\/\/iconchallenge.insight-centre.org\/) - 2014 \n**Please cite**: \n\n**ICON Challenge on Forecasting and Scheduling** \nWe consider the following problem: You are running a cloud computing service, where customers contract to run computing services (tasks). Each task has a duration, an earliest start and latest end, and resource requirements for CPU, Memory and I\/O attributes. The tasks can be scheduled on one of multiple servers, each server has a limited capacity for the CPU, memory and I\/O attributes. Multiple tasks can run concurrently on the same machine if the total resource consumption for all attributes is below the respective capacity. All tasks must be scheduled within their release and due dates; these dates are set so that no task stretches over midnight between two days. Tasks cannot be interrupted; once started, they must run for their given duration. If a machine is used by a task, it must be running at that time. In addition to the cost of running the allocated tasks, the machine consumes some idle power if it is on. Every time a machine is switched on or off, a start-up or shut-down cost, respectively, must be paid. All machines are off at the beginning of the planning period, and all machines must be off at the end of the planning period.\n\nThe price of electricity for the data centre is a real-time price, and varies throughout the day. The actual price is not known in advance, so a forecast must be used to generate a schedule. The total cost of the schedule is determined after the fact by applying the actual price of electricity to the energy consumption in each time period. One forecast of the price is given by the organizers. 
However, there may be a large discrepancy between the forecast and actual price, offering the opportunity to generate better forecasts based on historical data for demand and prices, and previous forecast information. Note that a forecast with a low error is not automatically guaranteed to lead to a schedule with a low overall cost.\n\nIn the forecast problem, we have to predict the actual electricity price for one day into the future based on historical and forecasted data. The historical data is available from September 2011 onwards. Missing values are marked with ?. The following fields are defined:\n\n**DateTime** String, defines date and time of sample \n**Holiday** String, gives name of holiday if day is a bank holiday \n**HolidayFlag** integer, 1 if day is a bank holiday, zero otherwise \n**DayOfWeek** integer (0-6), day of week, 0 = Monday \n**WeekOfYear** integer, running week within year of this date \n**Day** integer, day of the date \n**Month** integer, month of the date \n**Year** integer, year of the date \n**PeriodOfDay** integer, denotes half-hour period of day (0-47) \n**ForecastWindProduction** the forecasted wind production for this period \n**SystemLoadEA** the national load forecast for this period \n**SMPEA** the price forecast for this period \n**ORKTemperature** the actual temperature measured at Cork airport \n**ORKWindspeed** the actual windspeed measured at Cork airport \n**CO2Intensity** the actual CO2 intensity (in g\/kWh) for the electricity produced \n**ActualWindProduction** the actual wind energy production for this period \n**SystemLoadEP2** the actual national system load for this period \n**SMPEP2** the actual price of this time period, the value to be forecasted \n\nThe last four fields are only available for historical data, i.e. 
they can not be used to make the forecast.", "format": "ARFF", "uploader": "Joaquin Vanschoren", "uploader_id": 2, "visibility": "public", "creator": null, "contributor": null, "date": "2014-10-09 23:59:24", "update_comment": "added ignore feature", "last_update": "2014-10-10 00:34:30", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/66377\/phphy7RZ7", "default_target_attribute": "SMPEP2", "row_id_attribute": null, "ignore_attribute": "\"DateTime\"", "runs": 0, "suggest": { "input": [ "electricity_prices_ICON", "We consider the following problem: You are running a cloud computing service, where customers contract to run computing services (tasks). Each task has a duration, an earliest start and latest end, and resource requirements for CPU, Memory and I\/O attributes. The tasks can be scheduled on one of multiple servers, each server has a limited capacity for the CPU, memory and I\/O attributes. Multiple tasks can run concurrently on the same machine if the total resource consumption for all attributes i " ], "weight": 5 }, "qualities": [], "tags": [ { "uploader": "38960", "tag": "Chemistry" }, { "uploader": "38960", "tag": "Life Science" } ], "features": [ { "name": "SMPEP2", "index": "17", "type": "numeric", "distinct": "7813", "missing": "2", "target": "1", "min": "-48", "max": "1000", "mean": "64", "stdev": "35" }, { "name": "DateTime", "index": "0", "type": "string", "distinct": "38014", "missing": "0", "ignore": "1" }, { "name": "Holiday", "index": "1", "type": "nominal", "distinct": "15", "missing": "0", "distr": [] }, { "name": "HolidayFlag", "index": "2", "type": "numeric", "distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "DayOfWeek", "index": "3", "type": "numeric", "distinct": "7", "missing": "0", "min": "0", "max": "6", "mean": "3", "stdev": "2" }, { "name": "WeekOfYear", "index": "4", "type": "numeric", "distinct": "52", "missing": "0", 
"min": "1", "max": "52", "mean": "28", "stdev": "16" }, { "name": "Day", "index": "5", "type": "numeric", "distinct": "31", "missing": "0", "min": "1", "max": "31", "mean": "16", "stdev": "9" }, { "name": "Month", "index": "6", "type": "numeric", "distinct": "12", "missing": "0", "min": "1", "max": "12", "mean": "7", "stdev": "4" }, { "name": "Year", "index": "7", "type": "numeric", "distinct": "3", "missing": "0", "min": "2011", "max": "2013", "mean": "2012", "stdev": "1" }, { "name": "PeriodOfDay", "index": "8", "type": "numeric", "distinct": "48", "missing": "0", "min": "0", "max": "47", "mean": "24", "stdev": "14" }, { "name": "ForecastWindProduction", "index": "9", "type": "numeric", "distinct": "27475", "missing": "5", "min": "1", "max": "1680", "mean": "544", "stdev": "414" }, { "name": "SystemLoadEA", "index": "10", "type": "numeric", "distinct": "35584", "missing": "2", "min": "2184", "max": "6493", "mean": "4020", "stdev": "860" }, { "name": "SMPEA", "index": "11", "type": "numeric", "distinct": "7339", "missing": "2", "min": "0", "max": "588", "mean": "63", "stdev": "32" }, { "name": "ORKTemperature", "index": "12", "type": "numeric", "distinct": "31", "missing": "295", "min": "-4", "max": "25", "mean": "10", "stdev": "4" }, { "name": "ORKWindspeed", "index": "13", "type": "numeric", "distinct": "52", "missing": "299", "min": "0", "max": "76", "mean": "19", "stdev": "10" }, { "name": "CO2Intensity", "index": "14", "type": "numeric", "distinct": "22458", "missing": "7", "min": "0", "max": "843", "mean": "479", "stdev": "85" }, { "name": "ActualWindProduction", "index": "15", "type": "numeric", "distinct": "1535", "missing": "5", "min": "1", "max": "1769", "mean": "521", "stdev": "378" }, { "name": "SystemLoadEP2", "index": "16", "type": "numeric", "distinct": "35653", "missing": "2", "min": "1810", "max": "6310", "mean": "3786", "stdev": "843" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, 
"reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }