{ "data_id": "44142", "name": "Bike_Sharing_Demand", "exact_name": "Bike_Sharing_Demand", "version": 8, "version_label": "1", "description": "Dataset used in the tabular data benchmark https:\/\/github.com\/LeoGrin\/tabular-benchmark, transformed in the same way. This dataset belongs to the \"regression on numerical features\" benchmark. Original description: \n \nBike sharing systems are new generation of traditional bike rentals where whole process from membership, rental and return \nback has become automatic. Through these systems, user is able to easily rent a bike from a particular position and return \nback at another position. Currently, there are about over 500 bike-sharing programs around the world which is composed of \nover 500 thousands bicycles. Today, there exists great interest in these systems due to their important role in traffic, \nenvironmental and health issues. \n\nApart from interesting real world applications of bike sharing systems, the characteristics of data being generated by\nthese systems make them attractive for the research. Opposed to other transport services such as bus or subway, the duration\nof travel, departure and arrival position is explicitly recorded in these systems. This feature turns bike sharing system into\na virtual sensor network that can be used for sensing mobility in the city. Hence, it is expected that most of important\nevents in the city could be detected via monitoring these data.\n\nBike-sharing rental process is highly correlated to the environmental and seasonal settings. For instance, weather conditions,\nprecipitation, day of week, season, hour of the day, etc. can affect the rental behaviors. The core data set is related to \nthe two-year historical log corresponding to years 2011 and 2012 from Capital Bikeshare system, Washington D.C., USA which is \npublicly available in http:\/\/capitalbikeshare.com\/system-data. 
We aggregated the data on both an hourly and a daily basis and then \nextracted and added the corresponding weather and seasonal information. Weather information is extracted from http:\/\/www.freemeteo.com. \n\nUse of this dataset in publications must be cited to the following publication:\nFanaee-T, Hadi, and Gama, Joao, \"Event labeling combining ensemble detectors and background knowledge\", \nProgress in Artificial Intelligence (2013): pp. 1-15, Springer Berlin Heidelberg, doi:10.1007\/s13748-013-0040-3.\n\nAttributes:\n- season : season (1:spring, 2:summer, 3:fall, 4:winter)\n- yr : year (0: 2011, 1:2012)\n- mnth : month ( 1 to 12)\n- hr : hour (0 to 23)\n- holiday : whether day is holiday or not (extracted from http:\/\/dchr.dc.gov\/page\/holiday-schedule)\n- weekday : day of the week\n- workingday : if day is neither weekend nor holiday is 1, otherwise is 0.\n- weathersit : \n - 1: Clear, Few clouds, Partly cloudy, Partly cloudy\n - 2: Mist + Cloudy, Mist + Broken clouds, Mist + Few clouds, Mist\n - 3: Light Snow, Light Rain + Thunderstorm + Scattered clouds, Light Rain + Scattered clouds\n - 4: Heavy Rain + Ice Pellets + Thunderstorm + Mist, Snow + Fog\n- temp : Normalized temperature in Celsius. The values are divided by 41 (max)\n- atemp: Normalized feeling temperature in Celsius. The values are divided by 50 (max)\n- hum: Normalized humidity. The values are divided by 100 (max)\n- windspeed: Normalized wind speed. 
The values are divided by 67 (max)\n- casual: count of casual users\n- registered: count of registered users\n- cnt: count of total rental bikes including both casual and registered\n\nThis version was cleaned up by Joaquin Vanschoren:\n- Category labels replaced by category names (season, weathersit, year)\n- Turned back normalization for temperature and windspeed for interpretability\n- Renamed features for readability", "format": "arff", "uploader": "Leo Grin", "uploader_id": 26324, "visibility": "public", "creator": "\"Hadi Fanaee-T and Joao Gama\"", "contributor": "\"Leo Grin\"", "date": "2022-07-05 20:51:10", "update_comment": null, "last_update": "2022-07-05 20:51:10", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/api.openml.org\/data\/download\/22103267\/dataset", "default_target_attribute": "count", "row_id_attribute": null, "ignore_attribute": null, "runs": 0, "suggest": { "input": [ "Bike_Sharing_Demand", "Dataset used in the tabular data benchmark https:\/\/github.com\/LeoGrin\/tabular-benchmark, transformed in the same way. This dataset belongs to the \"regression on numerical features\" benchmark. Original description: Bike sharing systems are new generation of traditional bike rentals where whole process from membership, rental and return back has become automatic. Through these systems, user is able to easily rent a bike from a particular position and return back at another position. 
Currently, the " ], "weight": 5 }, "qualities": { "NumberOfInstances": 17379, "NumberOfFeatures": 7, "NumberOfClasses": 0, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 7, "NumberOfSymbolicFeatures": 0, "PercentageOfMissingValues": 0, "AutoCorrelation": -63.92513522844976, "PercentageOfNumericFeatures": 100, "Dimensionality": 0.0004027849703665343, "MajorityClassPercentage": null, "PercentageOfSymbolicFeatures": 0, "MajorityClassSize": null, "MinorityClassPercentage": null, "MinorityClassSize": null, "NumberOfBinaryFeatures": 0, "PercentageOfBinaryFeatures": 0, "PercentageOfInstancesWithMissingValues": 0 }, "tags": [ { "uploader": "38960", "tag": "Demographics" }, { "uploader": "38960", "tag": "Machine Learning" } ], "features": [ { "name": "count", "index": "6", "type": "numeric", "distinct": "869", "missing": "0", "target": "1", "min": "1", "max": "977", "mean": "189", "stdev": "181" }, { "name": "month", "index": "0", "type": "numeric", "distinct": "12", "missing": "0", "min": "1", "max": "12", "mean": "7", "stdev": "3" }, { "name": "hour", "index": "1", "type": "numeric", "distinct": "24", "missing": "0", "min": "0", "max": "23", "mean": "12", "stdev": "7" }, { "name": "temp", "index": "2", "type": "numeric", "distinct": "50", "missing": "0", "min": "1", "max": "41", "mean": "20", "stdev": "8" }, { "name": "feel_temp", "index": "3", "type": "numeric", "distinct": "65", "missing": "0", "min": "0", "max": "50", "mean": "24", "stdev": "9" }, { "name": "humidity", "index": "4", "type": "numeric", "distinct": "89", "missing": "0", "min": "0", "max": "1", "mean": "1", "stdev": "0" }, { "name": "windspeed", "index": "5", "type": "numeric", "distinct": "30", "missing": "0", "min": "0", "max": "57", "mean": "13", "stdev": "8" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }