{ "data_id": "43653", "name": "NBA-PLAYERS--2016-2019", "exact_name": "NBA-PLAYERS--2016-2019", "version": 1, "version_label": "v1.0", "description": "Context\nThis Dataset was created for an University project in Milan. The goal of the project was to create a Robust Model to predict the All Star Game score for each player. \nThe score is calculated by dividing the players by conference and position held in the field (external or internal),\nthe athletes are ranked in descending order depending on the number of votes taken for each category\nvoter, so as to obtain three different rankings. From these for each player the rank is calculated (1st\nPosition involves Rank = 1, 2nd Position Rank = 2 etc. . . ). With the values obtained then an average is calculated\nweighed, with weight 0.50 to that of the votes of the fans and 0.25 to the two remaining.\nDoing this work we have merged some datasets from kaggle (https:\/\/www.kaggle.com\/noahgift\/social-power-nba), basketball-reference.com and hoopshype.com.\nObviously for our work we didn't use all of the variables and for a problem of indipendent observations we took only the last seasons' observation for each player.\nOther analysis could be performed using salary as a target but also a cluster analysis for players or a PCA.\nWe wouldn't be here without the help of others. Thank you Riccardo,Alfredo and Daniel.\nSome variables:\nPOS1= Main position (some players have a second position called POS2)\nG= Games played\nGS= Games started\nMP= Minutes played\nFG =Field Goals Per Game\nFGA=Field Goal Attempts Per Game\nFG.= Field Goal Percentage\nX3P= 3-Point Field Goals Per Game\nX3PA= 3-Point Field Goal Attempts Per Game\nX3P.= FG on 3-Pt FGAs.\nX2P =2-Point Field Goals Per Game\nX2PA =2-Point Field Goal Attempts Per Game\nX2P.= FG on 2-Pt FGAs.\neFG. = Effective Field Goal Percentage\nFT=Free Throws Per Game\nFTA = Free Throw Attempts Per Game\nFT.= Free Throw Percentage\nORB = Offensive Rebounds Per Game\nDRB = Defensive Rebounds Per Game\nTRB = Total Rebounds Per Game\nAST = Assists Per Game\nSTL= Steals Per Game\nBLK = Blocks Per Game\nTOV = Turnovers Per Game\nPF = Personal Fouls Per Game\nPTS =Points Per Game\nMEAN_VIEWS= Daily views on wikipedia\nPLAY= If the player played in the all star game", "format": "arff", "uploader": "Dustin Carrion", "uploader_id": 30123, "visibility": "public", "creator": null, "contributor": null, "date": "2022-03-24 01:01:51", "update_comment": null, "last_update": "2022-03-24 01:01:51", "licence": "CC0: Public Domain", "status": "active", "error_message": null, "url": "https:\/\/www.openml.org\/data\/download\/22102478\/dataset", "default_target_attribute": null, "row_id_attribute": null, "ignore_attribute": null, "runs": 0, "suggest": { "input": [ "NBA-PLAYERS--2016-2019", "Context This Dataset was created for an University project in Milan. The goal of the project was to create a Robust Model to predict the All Star Game score for each player. The score is calculated by dividing the players by conference and position held in the field (external or internal), the athletes are ranked in descending order depending on the number of votes taken for each category voter, so as to obtain three different rankings. From these for each player the rank is calculated (1st Posi " ], "weight": 5 }, "qualities": { "NumberOfInstances": 1408, "NumberOfFeatures": 45, "NumberOfClasses": null, "NumberOfMissingValues": 2891, "NumberOfInstancesWithMissingValues": 1398, "NumberOfNumericFeatures": 36, "NumberOfSymbolicFeatures": 0, "Dimensionality": 0.03196022727272727, "PercentageOfNumericFeatures": 80, "MajorityClassPercentage": null, "PercentageOfSymbolicFeatures": 0, "MajorityClassSize": null, "MinorityClassPercentage": null, "MinorityClassSize": null, "NumberOfBinaryFeatures": 0, "PercentageOfBinaryFeatures": 0, "PercentageOfInstancesWithMissingValues": 99.28977272727273, "AutoCorrelation": null, "PercentageOfMissingValues": 4.562815656565657 }, "tags": [ { "uploader": "38960", "tag": "Computer Systems" }, { "uploader": "38960", "tag": "Machine Learning" } ], "features": [ { "name": "Rk", "index": "0", "type": "numeric", "distinct": "539", "missing": "0", "min": "1", "max": "540", "mean": "258", "stdev": "151" }, { "name": "Player.x", "index": "1", "type": "string", "distinct": "660", "missing": "0" }, { "name": "Player_ID", "index": "2", "type": "string", "distinct": "660", "missing": "0" }, { "name": "Pos1", "index": "3", "type": "string", "distinct": "5", "missing": "0" }, { "name": "Pos2", "index": "4", "type": "string", "distinct": "4", "missing": "1396" }, { "name": "Age", "index": "5", "type": "numeric", "distinct": "24", "missing": "0", "min": "19", "max": "42", "mean": "26", "stdev": "4" }, { "name": "Tm", "index": "6", "type": "string", "distinct": "30", "missing": "0" }, { "name": "G", "index": "7", "type": "numeric", "distinct": "82", "missing": "0", "min": "1", "max": "82", "mean": "54", "stdev": "24" }, { "name": "GS", "index": "8", "type": "numeric", "distinct": "83", "missing": "0", "min": "0", "max": "82", "mean": "26", "stdev": "29" }, { "name": "MP", "index": "9", "type": "numeric", "distinct": "344", "missing": "0", "min": "1", "max": "38", "mean": "20", "stdev": "9" }, { "name": "FG", "index": "10", "type": "numeric", "distinct": "104", "missing": "0", "min": "0", "max": "11", "mean": "3", "stdev": "2" }, { "name": "FGA", "index": "11", "type": "numeric", "distinct": "200", "missing": "0", "min": "0", "max": "25", "mean": "7", "stdev": "5" }, { "name": "FG.", "index": "12", "type": "numeric", "distinct": "331", "missing": "4", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "X3P", "index": "13", "type": "numeric", "distinct": "41", "missing": "0", "min": "0", "max": "5", "mean": "1", "stdev": "1" }, { "name": "X3PA", "index": "14", "type": "numeric", "distinct": "90", "missing": "0", "min": "0", "max": "13", "mean": "2", "stdev": "2" }, { "name": "X3P.", "index": "15", "type": "numeric", "distinct": "260", "missing": "99", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "X2P", "index": "16", "type": "numeric", "distinct": "85", "missing": "0", "min": "0", "max": "10", "mean": "2", "stdev": "2" }, { "name": "X2PA", "index": "17", "type": "numeric", "distinct": "154", "missing": "0", "min": "0", "max": "19", "mean": "5", "stdev": "3" }, { "name": "X2P.", "index": "18", "type": "numeric", "distinct": "337", "missing": "15", "min": "0", "max": "1", "mean": "0", "stdev": "0" }, { "name": "eFG.", "index": "19", "type": "numeric", "distinct": "311", "missing": "4", "min": "0", "max": "2", "mean": "1", "stdev": "0" }, { "name": "FT", "index": "20", "type": "numeric", "distinct": "76", "missing": "0", "min": "0", "max": "10", "mean": "1", "stdev": "1" }, { "name": "FTA", "index": "21", "type": "numeric", "distinct": "89", "missing": "0", "min": "0", "max": "11", "mean": "2", "stdev": "2" }, { "name": "FT.", "index": "22", "type": "numeric", "distinct": "370", "missing": "47", "min": "0", "max": "1", "mean": "1", "stdev": "0" }, { "name": "ORB", "index": "23", "type": "numeric", "distinct": "46", "missing": "0", "min": "0", "max": "5", "mean": "1", "stdev": "1" }, { "name": "DRB", "index": "24", "type": "numeric", "distinct": "96", "missing": "0", "min": "0", "max": "11", "mean": "3", "stdev": "2" }, { "name": "TRB", "index": "25", "type": "numeric", "distinct": "122", "missing": "0", "min": "0", "max": "16", "mean": "4", "stdev": "2" }, { "name": "AST", "index": "26", "type": "numeric", "distinct": "91", "missing": "0", "min": "0", "max": "11", "mean": "2", "stdev": "2" }, { "name": "STL", "index": "27", "type": "numeric", "distinct": "24", "missing": "0", "min": "0", "max": "2", "mean": "1", "stdev": "0" }, { "name": "BLK", "index": "28", "type": "numeric", "distinct": "28", "missing": "0", "min": "0", "max": "3", "mean": "0", "stdev": "0" }, { "name": "TOV", "index": "29", "type": "numeric", "distinct": "47", "missing": "0", "min": "0", "max": "6", "mean": "1", "stdev": "1" }, { "name": "PF", "index": "30", "type": "numeric", "distinct": "41", "missing": "0", "min": "0", "max": "4", "mean": "2", "stdev": "1" }, { "name": "PTS", "index": "31", "type": "numeric", "distinct": "248", "missing": "0", "min": "0", "max": "36", "mean": "9", "stdev": "6" }, { "name": "Salary", "index": "32", "type": "numeric", "distinct": "832", "missing": "62", "min": "56845", "max": "37457154", "mean": "6790048", "stdev": "7452558" }, { "name": "mean_views", "index": "33", "type": "numeric", "distinct": "1084", "missing": "138", "min": "1", "max": "34148", "mean": "989", "stdev": "2131" }, { "name": "Season", "index": "34", "type": "string", "distinct": "3", "missing": "0" }, { "name": "Conference", "index": "35", "type": "string", "distinct": "2", "missing": "0" }, { "name": "Role", "index": "36", "type": "string", "distinct": "2", "missing": "0" }, { "name": "Fvot", "index": "37", "type": "numeric", "distinct": "1357", "missing": "0", "min": "3", "max": "4620809", "mean": "117696", "stdev": "428627" }, { "name": "FRank", "index": "38", "type": "numeric", "distinct": "145", "missing": "0", "min": "1", "max": "145", "mean": "62", "stdev": "37" }, { "name": "Pvot", "index": "39", "type": "numeric", "distinct": "85", "missing": "159", "min": "0", "max": "269", "mean": "8", "stdev": "26" }, { "name": "PRank", "index": "40", "type": "numeric", "distinct": "51", "missing": "159", "min": "1", "max": "88", "mean": "43", "stdev": "23" }, { "name": "Mvot", "index": "41", "type": "numeric", "distinct": "38", "missing": "404", "min": "0", "max": "100", "mean": "3", "stdev": "15" }, { "name": "MRank", "index": "42", "type": "numeric", "distinct": "9", "missing": "404", "min": "1", "max": "9", "mean": "7", "stdev": "1" }, { "name": "Score", "index": "43", "type": "numeric", "distinct": "572", "missing": "0", "min": "1", "max": "167", "mean": "76", "stdev": "41" }, { "name": "Play", "index": "44", "type": "string", "distinct": "2", "missing": "0" } ], "nr_of_issues": 0, "nr_of_downvotes": 0, "nr_of_likes": 0, "nr_of_downloads": 0, "total_downloads": 0, "reach": 0, "reuse": 0, "impact_of_reuse": 0, "reach_of_reuse": 0, "impact": 0 }