In [1]:
# import Pandas
import pandas as pd

# import os
import os

# import numpy
import numpy as np

# import pyplot
import matplotlib.pyplot as plt

In [2]:
# Source data: "NBA Player Stats since 1950", a flat CSV file from Kaggle
# https://www.kaggle.com/drgilermo/nba-players-stats
# The file is expected to sit next to this notebook.
player_stats_inp = pd.read_csv("Seasons_Stats.csv")
player_stats_inp.head(n=5)

Unnamed: 0.1,Unnamed: 0,Year,Player,Pos,Age,Tm,G,GS,MP,PER,...,FT%,ORB,DRB,TRB,AST,STL,BLK,TOV,PF,PTS
0,0,1950.0,Curly Armstrong,G-F,31.0,FTW,63.0,,,,...,0.705,,,,176.0,,,,217.0,458.0
1,1,1950.0,Cliff Barker,SG,29.0,INO,49.0,,,,...,0.708,,,,109.0,,,,99.0,279.0
2,2,1950.0,Leo Barnhorst,SF,25.0,CHS,67.0,,,,...,0.698,,,,140.0,,,,192.0,438.0
3,3,1950.0,Ed Bartels,F,24.0,TOT,15.0,,,,...,0.559,,,,20.0,,,,29.0,63.0
4,4,1950.0,Ed Bartels,F,24.0,DNN,13.0,,,,...,0.548,,,,20.0,,,,27.0,59.0


In [3]:
# Clean up the player stats data to get ready for merging.

# Columns kept from the raw file: identifiers, season totals and advanced metrics.
stats_columns = [
    "Year", "Player", "Age", "Tm", "PER", "GS", "ORB", "TRB", "DRB", "MP", "G",
    "TS%", "FTr", "OWS", "DWS", "WS", "WS/48", "FG%", "2P", "2PA", "2P%", "eFG%",
    "PF", "3P%", "FT%", "FG", "FGA", "3P", "3PA", "FT", "FTA", "PTS",
    "AST", "STL", "BLK", "TOV", "ORB%", "DRB%", "TRB%", "AST%", "STL%", "BLK%",
    "TOV%", "USG%", "OBPM", "DBPM", "BPM", "VORP",
]

player_stats_df = (
    player_stats_inp[stats_columns]
    # Drop every row that is missing a value in any kept column.
    .dropna()
    # Year and Age are read as floats (e.g. 1950.0); store them as integers.
    .astype({"Year": int, "Age": int})
    # Rename columns: "Name" is the merge key used by the other datasets.
    .rename(columns={"Player": "Name", "G": "GP"})
    # Explicit copy so the column assignments below write to an independent
    # frame and cannot trigger SettingWithCopyWarning.
    .copy()
)

# Delete every "*" in the name column to keep names consistent across datasets.
# regex=False: "*" must be treated as a literal character, not a regex operator.
player_stats_df["Name"] = player_stats_df["Name"].str.replace("*", "", regex=False)

# Ratio of games started to games played.
player_stats_df["GS/GP"] = player_stats_df["GS"] / player_stats_df["GP"]

player_stats_df

Unnamed: 0,Year,Name,Age,Tm,PER,GS,ORB,TRB,DRB,MP,...,AST%,STL%,BLK%,TOV%,USG%,OBPM,DBPM,BPM,VORP,GS/GP
5730,1980,Tiny Archibald,31,BOS,15.3,80.0,59.0,197.0,138.0,2864.0,...,30.2,1.7,0.2,19.7,17.0,1.1,-1.1,0.0,1.5,1.000000
5748,1980,Larry Bird,23,BOS,20.5,82.0,216.0,852.0,636.0,2955.0,...,18.5,2.3,1.0,14.0,25.3,2.7,2.6,5.3,5.4,1.000000
5781,1980,M.L. Carr,29,BOS,14.6,7.0,106.0,330.0,224.0,1994.0,...,10.7,2.8,1.0,14.1,20.2,-0.2,1.5,1.3,1.7,0.085366
5786,1980,Don Chaney,33,BOS,7.8,0.0,31.0,73.0,42.0,523.0,...,9.3,2.8,1.2,13.7,18.3,-4.0,0.9,-3.1,-0.1,0.000000
5802,1980,Dave Cowens,31,BOS,14.8,55.0,126.0,534.0,408.0,2159.0,...,13.4,1.5,1.6,9.9,20.1,-0.7,2.0,1.4,1.8,0.833333
5835,1980,Chris Ford,31,BOS,13.0,73.0,77.0,181.0,104.0,2115.0,...,13.5,2.5,0.7,12.2,16.2,1.4,0.8,2.2,2.2,1.000000
5867,1980,Gerald Henderson,24,BOS,12.7,2.0,37.0,83.0,46.0,1061.0,...,19.0,2.0,0.8,19.9,20.5,-1.5,-0.9,-2.4,-0.1,0.026316
5901,1980,Jeff Judkins,23,BOS,14.1,0.0,32.0,66.0,34.0,674.0,...,9.9,2.0,0.4,13.7,21.1,0.2,-1.4,-1.3,0.1,0.000000
5947,1980,Pete Maravich,32,TOT,13.8,4.0,17.0,78.0,61.0,964.0,...,13.8,1.2,0.4,12.2,28.9,-2.0,-3.8,-5.8,-0.9,0.093023
5949,1980,Pete Maravich,32,BOS,15.6,4.0,10.0,38.0,28.0,442.0,...,10.4,1.0,0.3,11.9,27.9,-0.9,-3.3,-4.2,-0.2,0.153846


In [4]:
# player_stats_df should be on a per-game basis instead of season totals, to
# eliminate the effect of games played.

# Season-total column -> name of the per-game column derived from it.
# The same mapping drives both the division and the removal of the totals, so
# the two steps cannot drift apart (the previous hand-written drop list missed
# "3PA", leaving that season total in the output).
per_game_names = {
    "MP": "MPG",
    "ORB": "ORPG",
    "DRB": "DRPG",
    "TRB": "RPG",
    "AST": "APG",
    "STL": "SPG",
    "BLK": "BPG",
    "TOV": "TPG",
    "PF": "PFPG",
    "PTS": "PPG",
    "FG": "FGPG",
    "FGA": "FGAPG",
    "3P": "3PPG",
    "3PA": "3PAPG",
    "2P": "2PPG",
    "2PA": "2PAPG",
    "FT": "FTPG",
    "FTA": "FTAPG",
}
total_columns = list(per_game_names)

# Divide every total by games played, row by row.
per_game_df = (
    player_stats_df[total_columns]
    .div(player_stats_df["GP"], axis=0)
    .rename(columns=per_game_names)
)

# Drop all total columns and append the per-game columns in their place.
# A new frame is built instead of mutating in place (no inplace=True).
player_stats_df = pd.concat(
    [player_stats_df.drop(columns=total_columns), per_game_df],
    axis=1,
)

In [5]:
# Collapse the data to one row per (Year, Name) by averaging that player's rows
# for the season. A player can have several rows in one season (e.g. a "TOT"
# row plus one row per team).
# numeric_only=True: the string column "Tm" cannot be averaged; pandas >= 2.0
# raises a TypeError for it instead of silently dropping the column.
# NOTE(review): this is an unweighted mean that mixes the "TOT" row with the
# per-team rows, so GP and the per-game stats of such players are blended
# values rather than season figures -- confirm this is intended.
player_stats_df_unique = player_stats_df.groupby(['Year', 'Name']).mean(numeric_only=True)
player_stats_df_unique


Unnamed: 0_level_0,Unnamed: 1_level_0,Age,PER,GS,GP,TS%,FTr,OWS,DWS,WS,WS/48,...,PFPG,PPG,FGPG,FGAPG,3PPG,3PAPG,2PPG,2PAPG,FTPG,FTAPG
Year,Name,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1,Unnamed: 22_level_1
1980,Chris Ford,31.0,13.000000,73.000000,73.000000,0.537000,0.161000,2.900000,2.600000,5.600000,0.126000,...,2.438356,11.178082,4.520548,9.712329,0.958904,2.246575,3.561644,7.465753,1.178082,1.561644
1980,Dave Cowens,31.0,14.800000,55.000000,66.000000,0.477000,0.131000,1.900000,3.600000,5.400000,0.121000,...,3.272727,14.242424,6.393939,14.121212,0.015152,0.181818,6.378788,13.939394,1.439394,1.848485
1980,Don Chaney,33.0,7.800000,0.000000,60.000000,0.402000,0.222000,-0.400000,0.800000,0.400000,0.033000,...,1.333333,2.783333,1.116667,3.150000,0.016667,0.100000,1.100000,3.050000,0.533333,0.700000
1980,Gerald Henderson,24.0,12.700000,2.000000,76.000000,0.539000,0.338000,0.500000,1.200000,1.700000,0.078000,...,1.263158,6.223684,2.513158,5.026316,0.026316,0.078947,2.486842,4.947368,1.171053,1.697368
1980,Jeff Judkins,23.0,14.100000,0.000000,65.000000,0.567000,0.275000,1.100000,0.800000,1.800000,0.131000,...,1.400000,5.400000,2.138462,4.246154,0.169231,0.415385,1.969231,3.830769,0.953846,1.169231
1980,Larry Bird,23.0,20.500000,82.000000,82.000000,0.538000,0.246000,5.600000,5.600000,11.200000,0.182000,...,3.402439,21.280488,8.451220,17.841463,0.707317,1.743902,7.743902,16.097561,3.670732,4.390244
1980,M.L. Carr,29.0,14.600000,7.000000,82.000000,0.526000,0.316000,1.900000,3.200000,5.200000,0.125000,...,2.609756,11.146341,4.414634,9.304878,0.146341,0.500000,4.268293,8.804878,2.170732,2.939024
1980,Pete Maravich,32.0,14.700000,4.000000,34.500000,0.523500,0.207000,0.350000,0.400000,0.750000,0.068500,...,1.860912,12.598837,5.202594,11.102415,0.173971,0.251342,5.028623,10.851073,2.019678,2.278623
1980,Rick Robey,24.0,15.400000,27.000000,82.000000,0.557000,0.370000,2.800000,2.700000,5.500000,0.139000,...,2.975610,11.487805,4.621951,8.865854,0.000000,0.012195,4.621951,8.853659,2.243902,3.280488
1980,Tiny Archibald,31.0,15.300000,80.000000,80.000000,0.574000,0.548000,5.900000,2.900000,8.900000,0.148000,...,2.725000,14.137500,4.787500,9.925000,0.050000,0.225000,4.737500,9.700000,4.512500,5.437500


In [6]:
# Move the two group keys out of the index and back into ordinary columns so
# they can serve as merge keys later on.
player_stats_df_unique = player_stats_df_unique.reset_index(level=["Year", "Name"])

In [7]:
# Persist the cleaned per-player, per-season stats (row index not written).
player_stats_df_unique.to_csv(path_or_buf="player_stats_clean.csv", index=False)

In [9]:
# Load the companion datasets from their sibling directories.
salary_df   = pd.read_csv("../salary/salary_drop_repeat_10_16.csv")
physical_df = pd.read_csv("../physical_characteristics/phy_chara_clean.csv")
cap_df      = pd.read_csv("../salary_cap/salary_cap_clean.csv")
injuries_df = pd.read_csv("../injuries/injuries_very_clean.csv")


In [10]:
# Peek at the first five injury records.
injuries_df.head(n=5)

Unnamed: 0,Year,Name,Injury_DTD,Injury_DNP,Injury_Out_Indef,Injury_Out_Season,Injury_Returned,Injury_Other
0,2010,Al Harrington,0,0,0,0,0,0
1,2010,Anderson Varejao,0,0,0,0,0,0
2,2010,Andre Iguodala,0,1,0,0,0,0
3,2010,Andrea Bargnani,0,2,0,0,0,0
4,2010,Andrew Bogut,0,6,0,0,0,0


In [11]:
# No renaming is needed here: the injuries file loaded above already exposes
# the "Year" and "Name" columns that the merges below use as keys.
injuries_df.head()

Unnamed: 0,Year,Name,Injury_DTD,Injury_DNP,Injury_Out_Indef,Injury_Out_Season,Injury_Returned,Injury_Other
0,2010,Al Harrington,0,0,0,0,0,0
1,2010,Anderson Varejao,0,0,0,0,0,0
2,2010,Andre Iguodala,0,1,0,0,0,0
3,2010,Andrea Bargnani,0,2,0,0,0,0
4,2010,Andrew Bogut,0,6,0,0,0,0


In [12]:
# Attach salaries to the stats. Inner join: only (Year, Name) pairs present in
# both frames are kept.
player_salary_df = player_stats_df_unique.merge(
    salary_df,
    how="inner",
    on=["Year", "Name"],
)
player_salary_df.head(n=30)

Unnamed: 0,Year,Name,Age,PER,GS,GP,TS%,FTr,OWS,DWS,...,PPG,FGPG,FGAPG,3PPG,3PAPG,2PPG,2PAPG,FTPG,FTAPG,Salary
0,2010,Aaron Brooks,25.0,16.0,82.0,82.0,0.549,0.224,3.9,1.6,...,19.560976,7.012195,16.231707,2.54878,6.402439,4.463415,9.829268,2.987805,3.634146,2016692.0
1,2010,Acie Law,25.0,15.05,0.5,13.0,0.584,0.6905,0.175,0.075,...,4.455983,1.362927,2.803098,0.18141,0.581624,1.181517,2.221474,1.548718,1.978098,633253.0
2,2010,Al Harrington,29.0,16.8,15.0,72.0,0.546,0.308,2.2,1.3,...,17.722222,6.222222,14.305556,1.944444,5.680556,4.277778,8.625,3.333333,4.402778,5765000.0
3,2010,Al Horford,23.0,19.4,81.0,81.0,0.594,0.319,6.9,3.9,...,14.17284,5.765432,10.45679,0.012346,0.012346,5.753086,10.444444,2.62963,3.333333,5444857.0
4,2010,Al Jefferson,25.0,19.0,76.0,76.0,0.524,0.236,2.3,2.3,...,17.118421,7.368421,14.802632,0.0,0.052632,7.368421,14.75,2.381579,3.5,13000000.0
5,2010,Al Thornton,26.0,11.833333,30.666667,50.0,0.522,0.315667,0.8,0.666667,...,10.710588,4.24902,9.01098,0.164902,0.465392,4.084118,8.545588,2.047647,2.846275,211084.0
6,2010,Alando Tucker,25.0,14.55,0.0,13.0,0.5385,0.619,0.15,0.0,...,3.654545,1.157576,2.663636,0.078788,0.551515,1.078788,2.112121,1.260606,1.654545,1071720.0
7,2010,Allen Iverson,34.0,14.466667,16.0,18.666667,0.538,0.429,0.333333,0.133333,...,13.334444,4.899048,10.51746,0.324921,0.72873,4.574127,9.78873,3.211429,4.479524,650686.0
8,2010,Alonzo Gee,22.0,16.2,2.0,11.0,0.564,0.492,0.3,0.1,...,7.363636,2.545455,5.363636,0.636364,0.818182,1.909091,4.545455,1.636364,2.636364,641141.0
9,2010,Amar'e Stoudemire,27.0,22.6,82.0,82.0,0.615,0.5,8.2,2.5,...,23.121951,8.585366,15.414634,0.012195,0.073171,8.573171,15.341463,5.939024,7.707317,16486611.0


In [13]:
# Add the physical characteristics. Inner join again, so rows without a match
# in physical_df are dropped.
player_salary_physical_df = player_salary_df.merge(
    physical_df,
    how="inner",
    on=["Year", "Name"],
)

In [14]:
# Add the salary-cap columns, matched on Year only (inner join).
player_salary_physical_cap_df = player_salary_physical_df.merge(
    cap_df,
    how="inner",
    on=["Year"],
)
player_salary_physical_cap_df

Unnamed: 0,Year,Name,Age,PER,GS,GP,TS%,FTr,OWS,DWS,...,3PPG,3PAPG,2PPG,2PAPG,FTPG,FTAPG,Salary,player_height,player_weight,Salary Cap
0,2010,Aaron Brooks,25.0,16.000000,82.000000,82.000000,0.549000,0.224000,3.900000,1.600000,...,2.548780,6.402439,4.463415,9.829268,2.987805,3.634146,2016692.0,182.88,73.028312,57700000
1,2010,Acie Law,25.0,15.050000,0.500000,13.000000,0.584000,0.690500,0.175000,0.075000,...,0.181410,0.581624,1.181517,2.221474,1.548718,1.978098,633253.0,190.50,91.625584,57700000
2,2010,Al Harrington,29.0,16.800000,15.000000,72.000000,0.546000,0.308000,2.200000,1.300000,...,1.944444,5.680556,4.277778,8.625000,3.333333,4.402778,5765000.0,205.74,113.398000,57700000
3,2010,Al Horford,23.0,19.400000,81.000000,81.000000,0.594000,0.319000,6.900000,3.900000,...,0.012346,0.012346,5.753086,10.444444,2.629630,3.333333,5444857.0,208.28,111.130040,57700000
4,2010,Al Jefferson,25.0,19.000000,76.000000,76.000000,0.524000,0.236000,2.300000,2.300000,...,0.000000,0.052632,7.368421,14.750000,2.381579,3.500000,13000000.0,208.28,127.005760,57700000
5,2010,Al Thornton,26.0,11.833333,30.666667,50.000000,0.522000,0.315667,0.800000,0.666667,...,0.164902,0.465392,4.084118,8.545588,2.047647,2.846275,211084.0,203.20,106.594120,57700000
6,2010,Alonzo Gee,22.0,16.200000,2.000000,11.000000,0.564000,0.492000,0.300000,0.100000,...,0.636364,0.818182,1.909091,4.545455,1.636364,2.636364,641141.0,198.12,99.790240,57700000
7,2010,Amar'e Stoudemire,27.0,22.600000,82.000000,82.000000,0.615000,0.500000,8.200000,2.500000,...,0.012195,0.073171,8.573171,15.341463,5.939024,7.707317,16486611.0,208.28,108.862080,57700000
8,2010,Anderson Varejao,27.0,15.800000,7.000000,76.000000,0.598000,0.375000,4.300000,3.800000,...,0.013158,0.065789,3.500000,6.078947,1.526316,2.302632,7281818.0,210.82,117.933920,57700000
9,2010,Andray Blatche,23.0,17.600000,36.000000,81.000000,0.519000,0.234000,0.800000,2.600000,...,0.160494,0.543210,5.740741,11.790123,2.148148,2.888889,5904152.0,210.82,117.933920,57700000


In [15]:
# Save the stats + salary + physical + cap table (row index not written).
player_salary_physical_cap_df.to_csv(
    path_or_buf="player_salary_physical_cap_df.csv",
    index=False,
)

In [16]:
# Left join with the injuries data: every player-season row is kept, and rows
# with no match in injuries_df get NaN in the columns that come from it.
player_salary_physical_cap_injuries_df = player_salary_physical_cap_df.merge(
    injuries_df,
    how="left",
    on=["Year", "Name"],
)

In [17]:
# Inspect the result of the left merge; rows without a matching injuries record
# show NaN in the Injury_* columns.
player_salary_physical_cap_injuries_df

Unnamed: 0,Year,Name,Age,PER,GS,GP,TS%,FTr,OWS,DWS,...,Salary,player_height,player_weight,Salary Cap,Injury_DTD,Injury_DNP,Injury_Out_Indef,Injury_Out_Season,Injury_Returned,Injury_Other
0,2010,Aaron Brooks,25.0,16.000000,82.000000,82.000000,0.549000,0.224000,3.900000,1.600000,...,2016692.0,182.88,73.028312,57700000,,,,,,
1,2010,Acie Law,25.0,15.050000,0.500000,13.000000,0.584000,0.690500,0.175000,0.075000,...,633253.0,190.50,91.625584,57700000,,,,,,
2,2010,Al Harrington,29.0,16.800000,15.000000,72.000000,0.546000,0.308000,2.200000,1.300000,...,5765000.0,205.74,113.398000,57700000,0.0,0.0,0.0,0.0,0.0,0.0
3,2010,Al Horford,23.0,19.400000,81.000000,81.000000,0.594000,0.319000,6.900000,3.900000,...,5444857.0,208.28,111.130040,57700000,,,,,,
4,2010,Al Jefferson,25.0,19.000000,76.000000,76.000000,0.524000,0.236000,2.300000,2.300000,...,13000000.0,208.28,127.005760,57700000,,,,,,
5,2010,Al Thornton,26.0,11.833333,30.666667,50.000000,0.522000,0.315667,0.800000,0.666667,...,211084.0,203.20,106.594120,57700000,,,,,,
6,2010,Alonzo Gee,22.0,16.200000,2.000000,11.000000,0.564000,0.492000,0.300000,0.100000,...,641141.0,198.12,99.790240,57700000,,,,,,
7,2010,Amar'e Stoudemire,27.0,22.600000,82.000000,82.000000,0.615000,0.500000,8.200000,2.500000,...,16486611.0,208.28,108.862080,57700000,,,,,,
8,2010,Anderson Varejao,27.0,15.800000,7.000000,76.000000,0.598000,0.375000,4.300000,3.800000,...,7281818.0,210.82,117.933920,57700000,0.0,0.0,0.0,0.0,0.0,0.0
9,2010,Andray Blatche,23.0,17.600000,36.000000,81.000000,0.519000,0.234000,0.800000,2.600000,...,5904152.0,210.82,117.933920,57700000,,,,,,


In [18]:
# After the left merge, player-seasons with no row in the injuries data have
# NaN in the injury-count columns; treat those as zero recorded injuries.
# Only the Injury_* columns are filled: a blanket fillna(0) would also turn a
# missing value in any other column (e.g. Salary) into a misleading 0.
injury_columns = [
    col
    for col in player_salary_physical_cap_injuries_df.columns
    if col.startswith("Injury_")
]
player_salary_physical_cap_injuries_df = player_salary_physical_cap_injuries_df.fillna(
    {col: 0 for col in injury_columns}
)

In [19]:
# Display the frame again to confirm the missing injury counts are now 0.
player_salary_physical_cap_injuries_df

Unnamed: 0,Year,Name,Age,PER,GS,GP,TS%,FTr,OWS,DWS,...,Salary,player_height,player_weight,Salary Cap,Injury_DTD,Injury_DNP,Injury_Out_Indef,Injury_Out_Season,Injury_Returned,Injury_Other
0,2010,Aaron Brooks,25.0,16.000000,82.000000,82.000000,0.549000,0.224000,3.900000,1.600000,...,2016692.0,182.88,73.028312,57700000,0.0,0.0,0.0,0.0,0.0,0.0
1,2010,Acie Law,25.0,15.050000,0.500000,13.000000,0.584000,0.690500,0.175000,0.075000,...,633253.0,190.50,91.625584,57700000,0.0,0.0,0.0,0.0,0.0,0.0
2,2010,Al Harrington,29.0,16.800000,15.000000,72.000000,0.546000,0.308000,2.200000,1.300000,...,5765000.0,205.74,113.398000,57700000,0.0,0.0,0.0,0.0,0.0,0.0
3,2010,Al Horford,23.0,19.400000,81.000000,81.000000,0.594000,0.319000,6.900000,3.900000,...,5444857.0,208.28,111.130040,57700000,0.0,0.0,0.0,0.0,0.0,0.0
4,2010,Al Jefferson,25.0,19.000000,76.000000,76.000000,0.524000,0.236000,2.300000,2.300000,...,13000000.0,208.28,127.005760,57700000,0.0,0.0,0.0,0.0,0.0,0.0
5,2010,Al Thornton,26.0,11.833333,30.666667,50.000000,0.522000,0.315667,0.800000,0.666667,...,211084.0,203.20,106.594120,57700000,0.0,0.0,0.0,0.0,0.0,0.0
6,2010,Alonzo Gee,22.0,16.200000,2.000000,11.000000,0.564000,0.492000,0.300000,0.100000,...,641141.0,198.12,99.790240,57700000,0.0,0.0,0.0,0.0,0.0,0.0
7,2010,Amar'e Stoudemire,27.0,22.600000,82.000000,82.000000,0.615000,0.500000,8.200000,2.500000,...,16486611.0,208.28,108.862080,57700000,0.0,0.0,0.0,0.0,0.0,0.0
8,2010,Anderson Varejao,27.0,15.800000,7.000000,76.000000,0.598000,0.375000,4.300000,3.800000,...,7281818.0,210.82,117.933920,57700000,0.0,0.0,0.0,0.0,0.0,0.0
9,2010,Andray Blatche,23.0,17.600000,36.000000,81.000000,0.519000,0.234000,0.800000,2.600000,...,5904152.0,210.82,117.933920,57700000,0.0,0.0,0.0,0.0,0.0,0.0


In [20]:
# Express each salary as a percentage of that row's salary cap.
player_salary_physical_cap_injuries_df["Salary%"] = (
    player_salary_physical_cap_injuries_df["Salary"]
    .div(player_salary_physical_cap_injuries_df["Salary Cap"])
    .mul(100)
)

In [21]:
# Display the frame with the newly added Salary% column.
player_salary_physical_cap_injuries_df

Unnamed: 0,Year,Name,Age,PER,GS,GP,TS%,FTr,OWS,DWS,...,player_height,player_weight,Salary Cap,Injury_DTD,Injury_DNP,Injury_Out_Indef,Injury_Out_Season,Injury_Returned,Injury_Other,Salary%
0,2010,Aaron Brooks,25.0,16.000000,82.000000,82.000000,0.549000,0.224000,3.900000,1.600000,...,182.88,73.028312,57700000,0.0,0.0,0.0,0.0,0.0,0.0,3.495133
1,2010,Acie Law,25.0,15.050000,0.500000,13.000000,0.584000,0.690500,0.175000,0.075000,...,190.50,91.625584,57700000,0.0,0.0,0.0,0.0,0.0,0.0,1.097492
2,2010,Al Harrington,29.0,16.800000,15.000000,72.000000,0.546000,0.308000,2.200000,1.300000,...,205.74,113.398000,57700000,0.0,0.0,0.0,0.0,0.0,0.0,9.991334
3,2010,Al Horford,23.0,19.400000,81.000000,81.000000,0.594000,0.319000,6.900000,3.900000,...,208.28,111.130040,57700000,0.0,0.0,0.0,0.0,0.0,0.0,9.436494
4,2010,Al Jefferson,25.0,19.000000,76.000000,76.000000,0.524000,0.236000,2.300000,2.300000,...,208.28,127.005760,57700000,0.0,0.0,0.0,0.0,0.0,0.0,22.530329
5,2010,Al Thornton,26.0,11.833333,30.666667,50.000000,0.522000,0.315667,0.800000,0.666667,...,203.20,106.594120,57700000,0.0,0.0,0.0,0.0,0.0,0.0,0.365830
6,2010,Alonzo Gee,22.0,16.200000,2.000000,11.000000,0.564000,0.492000,0.300000,0.100000,...,198.12,99.790240,57700000,0.0,0.0,0.0,0.0,0.0,0.0,1.111163
7,2010,Amar'e Stoudemire,27.0,22.600000,82.000000,82.000000,0.615000,0.500000,8.200000,2.500000,...,208.28,108.862080,57700000,0.0,0.0,0.0,0.0,0.0,0.0,28.572983
8,2010,Anderson Varejao,27.0,15.800000,7.000000,76.000000,0.598000,0.375000,4.300000,3.800000,...,210.82,117.933920,57700000,0.0,0.0,0.0,0.0,0.0,0.0,12.620135
9,2010,Andray Blatche,23.0,17.600000,36.000000,81.000000,0.519000,0.234000,0.800000,2.600000,...,210.82,117.933920,57700000,0.0,0.0,0.0,0.0,0.0,0.0,10.232499


In [22]:
# Write the fully combined dataset to disk (row index not written).
player_salary_physical_cap_injuries_df.to_csv(
    path_or_buf="final_combine_player_data.csv",
    index=False,
)