{ "data_id": "43752", "name": "Crowdedness-at-the-Campus-Gym", "exact_name": "Crowdedness-at-the-Campus-Gym", "version": 1, "version_label": "v1.0", "description": "Background\nWhen is my university campus gym least crowded, so I know when to work out? We measured how many people were in this gym once every 10 minutes over the last year. We want to be able to predict how crowded the gym will be in the future.\nGoals\n\nGiven a time of day (and maybe some other features, including weather), predict how crowded the gym will be. \nFigure out which features are actually important, which are redundant, and what features could be added to make the predictions more accurate.\n\nData\nThe dataset consists of 26,000 people counts (about every 10 minutes) over the last year. In addition, I gathered extra info including weather and semester-specific information that might affect how crowded it is. The label is the number of people, which I'd like to predict given some subset of the features. \nLabel:\n\nNumber of people \n\nFeatures:\n\ndate (string; datetime of data)\ntimestamp (int; number of seconds since beginning of day)\ndayofweek (int; 0 [monday] - 6 [sunday])\nis_weekend (int; 0 or 1) [boolean, if 1, it's either saturday or sunday, otherwise 0]\nis_holiday (int; 0 or 1) [boolean, if 1 it's a federal holiday, 0 otherwise]\ntemperature (float; degrees fahrenheit)\nisstartof_semester (int; 0 or 1) [boolean, if 1 it's the beginning of a school semester, 0 otherwise]\nmonth (int; 1 [jan] - 12 [dec])\nhour (int; 0 - 23)\n\nAcknowledgements\nThis data was collected with the consent of the university and the gym in question.", "format": "arff", "uploader": "Dustin Carrion", "uploader_id": 30123, "visibility": "public", "creator": null, "contributor": null, "date": "2022-03-24 07:51:36", "update_comment": null, "last_update": "2022-03-24 07:51:36", "licence": "Database: Open Database, Contents: Database Contents", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/22102577\/dataset", "default_target_attribute": null, "row_id_attribute": null, "ignore_attribute": null, "runs": 0, "suggest": { "input": [ "Crowdedness-at-the-Campus-Gym", "Background When is my university campus gym least crowded, so I know when to work out? We measured how many people were in this gym once every 10 minutes over the last year. We want to be able to predict how crowded the gym will be in the future. Goals Given a time of day (and maybe some other features, including weather), predict how crowded the gym will be. Figure out which features are actually important, which are redundant, and what features could be added to make the predictions more accur " ], "weight": 5 }, "qualities": { "NumberOfInstances": 62184, "NumberOfFeatures": 11, "NumberOfClasses": null, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 10, "NumberOfSymbolicFeatures": 0, "Dimensionality": 0.0001768943779750418, "PercentageOfNumericFeatures": 90.9090909090909, "MajorityClassPercentage": null, "PercentageOfSymbolicFeatures": 0, "MajorityClassSize": null, "MinorityClassPercentage": null, "MinorityClassSize": null, "NumberOfBinaryFeatures": 0, "PercentageOfBinaryFeatures": 0, "PercentageOfInstancesWithMissingValues": 0, "AutoCorrelation": null, "PercentageOfMissingValues": 0 }, "tags": [ { "uploader": "38960", "tag": "Images" } ], "features": [ { "name": "number_people", "index": "0", "type": "numeric", "distinct": "128", "missing": "0", "min": "0", "max": "145", "mean": "29", "stdev": "23" }, { "name": "date", "index": "1", "type": "string", "distinct": "62184", "missing": "0" }, { "name": "timestamp", "index": "2", "type": "numeric", "distinct": "31321", "missing": "0", "min": "0", "max": "86399", "mean": "45799", "stdev": "24211" }, { "name": "day_of_week", "index": "3", "type": "numeric", "distinct": "7", "missing": "0", "min": "0", "max": "6", "mean": "3", "stdev": "2" }, { "name": "is_weekend", "index": "4", "type": "numeric", "distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "is_holiday", "index": "5", "type": "numeric", "distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "temperature", "index": "6", "type": "numeric", "distinct": "2599", "missing": "0", "min": "38", "max": "87", "mean": "59", "stdev": "6" }, { "name": "is_start_of_semester", "index": "7", "type": "numeric", "distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "is_during_semester", "index": "8", "type": "numeric", "distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "1", "stdev": "0" }, { "name": "month", "index": "9", "type": "numeric", "distinct": "12", "missing": "0", "min": "1", "max": "12", "mean": "7", "stdev": "3" }, { "name": "hour", "index": "10", "type": "numeric", "distinct": "24", "missing": "0", "min": "0", "max": "23", "mean": "12", "stdev": "7" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }