{ "data_id": "41555", "name": "scpf", "exact_name": "scpf", "version": 3, "version_label": null, "description": "Multivariate regression data set from: https:\/\/link.springer.com\/article\/10.1007%2Fs10994-016-5546-z : This is a pre-processed version of the dataset used in Kaggles See Click Predict Fix competition (Kaggle 2013). It concerns the prediction of three target variables that represent the number of views, clicks and comments that a specific 311 issue will receive. The issues have been collected from 4 cities (Oakland, Richmond, New Haven, Chicago) in the US and span a period of 12 months (01 2012-12 2012). The version of the dataset that we use here is a random 1 percent sample of the data. In terms of features we use the number of days that an issues stayed online, the source from where the issue was created (e.g. android, iphone, remote api, etc.), the type of the issue (e.g. graffiti, pothole, trash, etc.), the geographical co-ordinates of the issue, the city it was published from and the distance from the city center. All multi-valued nominal variables were first transformed to binary and then rare binary variables (being true for less than 1 percent of the cases) were removed.", "format": "ARFF", "uploader": "Quay Au", "uploader_id": 2373, "visibility": "public", "creator": null, "contributor": null, "date": "2019-04-03 09:01:16", "update_comment": null, "last_update": "2019-04-03 09:01:16", "licence": "Public", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/21241899\/file20386dbb5661.arff", "default_target_attribute": "num_views,num_votes,num_comments", "row_id_attribute": null, "ignore_attribute": null, "runs": 0, "suggest": { "input": [ "scpf", "Multivariate regression data set from: https:\/\/link.springer.com\/article\/10.1007%2Fs10994-016-5546-z : This is a pre-processed version of the dataset used in Kaggles See Click Predict Fix competition (Kaggle 2013). It concerns the prediction of three target variables that represent the number of views, clicks and comments that a specific 311 issue will receive. The issues have been collected from 4 cities (Oakland, Richmond, New Haven, Chicago) in the US and span a period of 12 months (01 2012-1 " ], "weight": 5 }, "qualities": { "NumberOfInstances": 1137, "NumberOfFeatures": 26, "NumberOfClasses": null, "NumberOfMissingValues": 9255, "NumberOfInstancesWithMissingValues": 994, "NumberOfNumericFeatures": 26, "NumberOfSymbolicFeatures": 0, "ClassEntropy": null, "MeanNoiseToSignalRatio": null, "Quartile2AttributeEntropy": null, "Dimensionality": 0.022867194371152155, "MeanNominalAttDistinctValues": null, "Quartile2KurtosisOfNumericAtts": 11.373873417236027, "EquivalentNumberOfAtts": null, "MeanSkewnessOfNumericAtts": 4.190241416135885, "Quartile2MeansOfNumericAtts": 0.09867663612750036, "MajorityClassPercentage": null, "MeanStdDevOfNumericAtts": 5.713316388007543, "Quartile2MutualInformation": null, "MajorityClassSize": null, "MinAttributeEntropy": null, "Quartile2SkewnessOfNumericAtts": 3.6060439246902667, "MaxAttributeEntropy": null, "MinKurtosisOfNumericAtts": -1.8078993706245141, "PercentageOfBinaryFeatures": 0, "Quartile2StdDevOfNumericAtts": 0.2984804167620109, "MaxKurtosisOfNumericAtts": 387.1929709080521, "MinMeansOfNumericAtts": -88.02821958135443, "PercentageOfInstancesWithMissingValues": 87.42304309586632, "Quartile3AttributeEntropy": null, "MaxMeansOfNumericAtts": 349.9665787159191, "MinMutualInformation": null, "PercentageOfMissingValues": 31.30708341790136, "Quartile3KurtosisOfNumericAtts": 31.074766114950503, "MaxMutualInformation": null, "MinNominalAttDistinctValues": null, "PercentageOfNumericFeatures": 100, "Quartile3MeansOfNumericAtts": 0.4340048872922708, "MaxNominalAttDistinctValues": null, "MinSkewnessOfNumericAtts": -1.8702573109321898, "PercentageOfSymbolicFeatures": 0, "Quartile3MutualInformation": null, "MaxSkewnessOfNumericAtts": 17.351438617321147, "MinStdDevOfNumericAtts": 0.09324809599273752, "Quartile1AttributeEntropy": null, "Quartile3SkewnessOfNumericAtts": 5.734669487493385, "MaxStdDevOfNumericAtts": 88.96058991537119, "MinorityClassPercentage": null, "Quartile1KurtosisOfNumericAtts": 0.5113027591909952, "Quartile3StdDevOfNumericAtts": 0.563233468567389, "MeanAttributeEntropy": null, "MinorityClassSize": null, "Quartile1MeansOfNumericAtts": 0.03644314868804668, "StdvNominalAttDistinctValues": null, "MeanKurtosisOfNumericAtts": 45.55438821528992, "NumberOfBinaryFeatures": 0, "Quartile1MutualInformation": null, "MeanMeansOfNumericAtts": 12.30270002453851, "Quartile1SkewnessOfNumericAtts": 1.0172595766184696, "AutoCorrelation": null, "MeanMutualInformation": null, "Quartile1StdDevOfNumericAtts": 0.19235206875192914 }, "tags": [ { "uploader": "2373", "tag": "2019_multioutput_paper_benchmark_data" }, { "uploader": "38960", "tag": "Culture" }, { "uploader": "38960", "tag": "Social Media" } ], "features": [ { "name": "num_views", "index": "23", "type": "numeric", "distinct": "96", "missing": "0", "target": "1", "min": "0", "max": "938", "mean": "13", "stdev": "38" }, { "name": "num_votes", "index": "24", "type": "numeric", "distinct": "11", "missing": "0", "target": "1", "min": "1", "max": "22", "mean": "2", "stdev": "1" }, { "name": "num_comments", "index": "25", "type": "numeric", "distinct": "9", "missing": "0", "target": "1", "min": "0", "max": "20", "mean": "0", "stdev": "1" }, { "name": "daysUntilLastIssue", "index": "0", "type": "numeric", "distinct": "268", "missing": "0", "min": "259", "max": "623", "mean": "350", "stdev": "89" }, { "name": "source_city_initiated", "index": "1", "type": "numeric", "distinct": "2", "missing": "263", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "source_android", "index": "2", "type": "numeric", "distinct": "2", "missing": "263", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "source_remote_api_created", "index": "3", "type": "numeric", "distinct": "2", "missing": "263", "min": "0", "max": "1", "mean": "1", "stdev": "0" }, { "name": "source_new_map_widget", "index": "4", "type": "numeric", "distinct": "2", "missing": "263", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "source_iphone", "index": "5", "type": "numeric", "distinct": "2", "missing": "263", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "tag_type_tree", "index": "6", "type": "numeric", "distinct": "2", "missing": "794", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "tag_type_street_light", "index": "7", "type": "numeric", "distinct": "2", "missing": "794", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "tag_type_graffiti", "index": "8", "type": "numeric", "distinct": "2", "missing": "794", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "tag_type_pothole", "index": "9", "type": "numeric", "distinct": "2", "missing": "794", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "tag_type_signs", "index": "10", "type": "numeric", "distinct": "2", "missing": "794", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "tag_type_overgrowth", "index": "11", "type": "numeric", "distinct": "2", "missing": "794", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "tag_type_traffic", "index": "12", "type": "numeric", "distinct": "2", "missing": "794", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "tag_type_trash", "index": "13", "type": "numeric", "distinct": "2", "missing": "794", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "tag_type_blighted_property", "index": "14", "type": "numeric", "distinct": "2", "missing": "794", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "tag_type_sidewalk", "index": "15", "type": "numeric", "distinct": "2", "missing": "794", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "latitude", "index": "16", "type": "numeric", "distinct": "1127", "missing": "0", "min": "37", "max": "42", "mean": "40", "stdev": "2" }, { "name": "longitude", "index": "17", "type": "numeric", "distinct": "1125", "missing": "0", "min": "-122", "max": "0", "mean": "-88", "stdev": "12" }, { "name": "city_Oakland", "index": "18", "type": "numeric", "distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "city_Chicago", "index": "19", "type": "numeric", "distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "1", "stdev": "0" }, { "name": "city_NH", "index": "20", "type": "numeric", "distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "city_Richmond", "index": "21", "type": "numeric", "distinct": "2", "missing": "0", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "distanceFromCenter", "index": "22", "type": "numeric", "distinct": "1127", "missing": "0", "min": "0", "max": "1", "mean": "0", "stdev": "0" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }