{ "data_id": "43655", "name": "Football---Expected-Goals-Match-Statistics", "exact_name": "Football---Expected-Goals-Match-Statistics", "version": 1, "version_label": "v1.0", "description": "Context\nIn recent years statisticians and data scientists alike have been trying to come up with new ways to evaluate team performance in Football. Sometimes a result is not a fair reflection on a teams performance, and this is where expected goals come in. \nExpected goals is a relatively new football metric, using quality of passing and goalscoring opportunities to rank a teams performance. Understat.com provides these statistics by using neural networks to approximate this data and I have therefore scraped statistics for matches played between the 2014-15 and 2019-2020 seasons to provide the following dataset.\nThe Leagues included in this representation are:\n\nEnglish Premier League\nLa Liga\nBundesliga\nSerie A\nLigue 1\nRussian Football Premier League\n\nContent\nThe dataset contains 22 columns, a lot of which will be self explanatory such as date, home team etc. Some of the less common features will be outlined below:\nChance - the percentage prediction of an outcome based on expected goals.\nExpected Goals - the number of goals a team is expected to score based on performance.\nDeep - number of passes completed within an estimated 20 yards from goal.\nPPDA - number of passes allowed per defensive action in the opposition half.\nExpected Points - number of points a team is expected to achieve in this game.\nInspiration\nIs the expected goals feature an accurate representation of a teams performance?\nHow can this feature be improved?\nCan we predict the outcome of future games based on previous games?", "format": "arff", "uploader": "Dustin Carrion", "uploader_id": 30123, "visibility": "public", "creator": null, "contributor": null, "date": "2022-03-24 01:02:12", "update_comment": null, "last_update": "2022-03-24 01:02:12", "licence": "CC0: Public Domain", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/22102480\/dataset", "default_target_attribute": null, "row_id_attribute": null, "ignore_attribute": null, "runs": 0, "suggest": { "input": [ "Football---Expected-Goals-Match-Statistics", "Context In recent years statisticians and data scientists alike have been trying to come up with new ways to evaluate team performance in Football. Sometimes a result is not a fair reflection on a teams performance, and this is where expected goals come in. Expected goals is a relatively new football metric, using quality of passing and goalscoring opportunities to rank a teams performance. Understat.com provides these statistics by using neural networks to approximate this data and I have there " ], "weight": 5 }, "qualities": { "NumberOfInstances": 10791, "NumberOfFeatures": 22, "NumberOfClasses": null, "NumberOfMissingValues": 0, "NumberOfInstancesWithMissingValues": 0, "NumberOfNumericFeatures": 15, "NumberOfSymbolicFeatures": 0, "Dimensionality": 0.0020387359836901123, "PercentageOfNumericFeatures": 68.18181818181817, "MajorityClassPercentage": null, "PercentageOfSymbolicFeatures": 0, "MajorityClassSize": null, "MinorityClassPercentage": null, "MinorityClassSize": null, "NumberOfBinaryFeatures": 0, "PercentageOfBinaryFeatures": 0, "PercentageOfInstancesWithMissingValues": 0, "AutoCorrelation": null, "PercentageOfMissingValues": 0 }, "tags": [ { "uploader": "38960", "tag": "Computer Systems" }, { "uploader": "38960", "tag": "Machine Learning" } ], "features": [ { "name": "Unnamed:_0", "index": "0", "type": "numeric", "distinct": "10791", "missing": "0", "min": "0", "max": "10790", "mean": "5395", "stdev": "3115" }, { "name": "Date", "index": "1", "type": "string", "distinct": "1072", "missing": "0" }, { "name": "League", "index": "2", "type": "string", "distinct": "6", "missing": "0" }, { "name": "Home_Team", "index": "3", "type": "string", "distinct": "163", "missing": "0" }, { "name": "Away_Team", "index": "4", "type": "string", "distinct": "163", "missing": "0" }, { "name": "Home_Chance_%", "index": "5", "type": "string", "distinct": "87", "missing": "0" }, { "name": "Draw_Chance_%", "index": "6", "type": "string", "distinct": "62", "missing": "0" }, { "name": "Away_Chance_%", "index": "7", "type": "string", "distinct": "87", "missing": "0" }, { "name": "Home_Goals", "index": "8", "type": "numeric", "distinct": "11", "missing": "0", "min": "0", "max": "10", "mean": "2", "stdev": "1" }, { "name": "Away_Goals", "index": "9", "type": "numeric", "distinct": "10", "missing": "0", "min": "0", "max": "9", "mean": "1", "stdev": "1" }, { "name": "Home_Expected_Goals", "index": "10", "type": "numeric", "distinct": "488", "missing": "0", "min": "0", "max": "7", "mean": "1", "stdev": "1" }, { "name": "Away_Expected_Goals", "index": "11", "type": "numeric", "distinct": "417", "missing": "0", "min": "0", "max": "6", "mean": "1", "stdev": "1" }, { "name": "Home_Shots", "index": "12", "type": "numeric", "distinct": "43", "missing": "0", "min": "0", "max": "47", "mean": "14", "stdev": "5" }, { "name": "Away_Shots", "index": "13", "type": "numeric", "distinct": "35", "missing": "0", "min": "0", "max": "34", "mean": "11", "stdev": "5" }, { "name": "Home_Shots_on_Target", "index": "14", "type": "numeric", "distinct": "19", "missing": "0", "min": "0", "max": "18", "mean": "5", "stdev": "3" }, { "name": "Away_Shots_on_Target", "index": "15", "type": "numeric", "distinct": "16", "missing": "0", "min": "0", "max": "15", "mean": "4", "stdev": "2" }, { "name": "Home_Deep", "index": "16", "type": "numeric", "distinct": "36", "missing": "0", "min": "0", "max": "35", "mean": "6", "stdev": "4" }, { "name": "Away_Deep", "index": "17", "type": "numeric", "distinct": "30", "missing": "0", "min": "0", "max": "29", "mean": "5", "stdev": "4" }, { "name": "Home_PPDA", "index": "18", "type": "numeric", "distinct": "1922", "missing": "0", "min": "2", "max": "97", "mean": "10", "stdev": "5" }, { "name": "Away_PPDA", "index": "19", "type": "numeric", "distinct": "2139", "missing": "0", "min": "2", "max": "152", "mean": "11", "stdev": "7" }, { "name": "Home_Expected_Points", "index": "20", "type": "numeric", "distinct": "301", "missing": "0", "min": "0", "max": "3", "mean": "2", "stdev": "1" }, { "name": "Away_Expected_Points", "index": "21", "type": "numeric", "distinct": "301", "missing": "0", "min": "0", "max": "3", "mean": "1", "stdev": "1" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }