In [2]:
import pandas as pd

# Load the three source tables from CSV files in the working directory.
teams = pd.read_csv('team.csv')
team_details = pd.read_csv('team_details.csv')
player_details = pd.read_csv('player_details.csv')

# Debugging aid: list each table's column names before joining.
for header, frame in (
    ("Colonnes dans teams:", teams),
    ("Colonnes dans team_details:", team_details),
    ("Colonnes dans player_details:", player_details),
):
    print(header, list(frame.columns))

# Step 1: left-join team_details onto teams via the shared 'abbreviation'
# column. Any other column name present in both tables receives the
# '_teams' / '_details' suffix so that both versions are kept.
base_teams = teams.merge(
    team_details,
    how='left',
    on='abbreviation',
    suffixes=('_teams', '_details'),
)

# Step 2: left-join the player rows onto the team table, matching the team
# 'abbreviation' against the players' 'team_abbreviation'.
base_finale = base_teams.merge(
    player_details,
    how='left',
    left_on='abbreviation',
    right_on='team_abbreviation',
)

# Show the column names of the final joined table.
print("\nColonnes dans base_finale:", list(base_finale.columns))

# Write the complete result (no column filtering), omitting the row index.
base_finale.to_csv('base_finale.csv', index=False)

print("Jointure terminée. Fichier base_finale.csv créé.")
print(f"Nombre de lignes : {len(base_finale)}")

Colonnes dans teams: ['id', 'full_name', 'abbreviation', 'nickname', 'city', 'state', 'year_founded']
Colonnes dans team_details: ['team_id', 'abbreviation', 'nickname', 'yearfounded', 'city', 'arena', 'arenacapacity', 'owner', 'generalmanager', 'headcoach', 'dleagueaffiliation', 'facebook', 'instagram', 'twitter']
Colonnes dans player_details: ['Unnamed: 0', 'player_name', 'team_abbreviation', 'age', 'player_height', 'player_weight', 'college', 'country', 'draft_year', 'draft_round', 'draft_number', 'gp', 'pts', 'reb', 'ast', 'net_rating', 'oreb_pct', 'dreb_pct', 'usg_pct', 'ts_pct', 'ast_pct', 'season']

Colonnes dans base_finale: ['id', 'full_name', 'abbreviation', 'nickname_teams', 'city_teams', 'state', 'year_founded', 'team_id', 'nickname_details', 'yearfounded', 'city_details', 'arena', 'arenacapacity', 'owner', 'generalmanager', 'headcoach', 'dleagueaffiliation', 'facebook', 'instagram', 'twitter', 'Unnamed: 0', 'player_name', 'team_abbreviation', 'age', 'player_height', 'playe

In [3]:
# Display the joined team/player table as this cell's output.
base_finale

Unnamed: 0,id,full_name,abbreviation,nickname_teams,city_teams,state,year_founded,team_id,nickname_details,yearfounded,...,pts,reb,ast,net_rating,oreb_pct,dreb_pct,usg_pct,ts_pct,ast_pct,season
0,1610612737,Atlanta Hawks,ATL,Hawks,Atlanta,Atlanta,1949.0,1.610613e+09,Hawks,1949.0,...,5.7,1.6,1.3,-0.3,0.036,0.076,0.172,0.539,0.141,1996-97
1,1610612737,Atlanta Hawks,ATL,Hawks,Atlanta,Atlanta,1949.0,1.610613e+09,Hawks,1949.0,...,6.7,1.5,0.4,1.2,0.034,0.067,0.171,0.555,0.036,1996-97
2,1610612737,Atlanta Hawks,ATL,Hawks,Atlanta,Atlanta,1949.0,1.610613e+09,Hawks,1949.0,...,4.9,1.7,2.0,5.0,0.031,0.087,0.152,0.535,0.193,1996-97
3,1610612737,Atlanta Hawks,ATL,Hawks,Atlanta,Atlanta,1949.0,1.610613e+09,Hawks,1949.0,...,1.4,2.8,0.3,2.5,0.104,0.189,0.083,0.439,0.042,1996-97
4,1610612737,Atlanta Hawks,ATL,Hawks,Atlanta,Atlanta,1949.0,1.610613e+09,Hawks,1949.0,...,18.1,8.8,2.7,11.0,0.084,0.186,0.236,0.562,0.133,1996-97
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
12064,1610612766,Charlotte Hornets,CHA,Hornets,Charlotte,North Carolina,1988.0,1.610613e+09,Hornets,1988.0,...,20.3,5.2,1.1,-7.7,0.038,0.121,0.257,0.534,0.057,2022-23
12065,1610612766,Charlotte Hornets,CHA,Hornets,Charlotte,North Carolina,1988.0,1.610613e+09,Hornets,1988.0,...,9.0,7.1,0.4,-4.7,0.106,0.232,0.168,0.659,0.033,2022-23
12066,1610612766,Charlotte Hornets,CHA,Hornets,Charlotte,North Carolina,1988.0,1.610613e+09,Hornets,1988.0,...,23.3,6.4,8.4,-4.7,0.031,0.147,0.289,0.541,0.352,2022-23
12067,1610612766,Charlotte Hornets,CHA,Hornets,Charlotte,North Carolina,1988.0,1.610613e+09,Hornets,1988.0,...,5.6,2.1,1.2,-8.3,0.015,0.116,0.192,0.463,0.117,2022-23


In [4]:
# Read the CSV file 'base_finale.csv' back into a DataFrame and display it.
df = pd.read_csv('base_finale.csv')
df

Unnamed: 0,id,full_name,abbreviation,nickname_teams,city_teams,state,year_founded,team_id,nickname_details,yearfounded,...,pts,reb,ast,net_rating,oreb_pct,dreb_pct,usg_pct,ts_pct,ast_pct,season
0,1610612737,Atlanta Hawks,ATL,Hawks,Atlanta,Atlanta,1949.0,1.610613e+09,Hawks,1949.0,...,5.7,1.6,1.3,-0.3,0.036,0.076,0.172,0.539,0.141,1996-97
1,1610612737,Atlanta Hawks,ATL,Hawks,Atlanta,Atlanta,1949.0,1.610613e+09,Hawks,1949.0,...,6.7,1.5,0.4,1.2,0.034,0.067,0.171,0.555,0.036,1996-97
2,1610612737,Atlanta Hawks,ATL,Hawks,Atlanta,Atlanta,1949.0,1.610613e+09,Hawks,1949.0,...,4.9,1.7,2.0,5.0,0.031,0.087,0.152,0.535,0.193,1996-97
3,1610612737,Atlanta Hawks,ATL,Hawks,Atlanta,Atlanta,1949.0,1.610613e+09,Hawks,1949.0,...,1.4,2.8,0.3,2.5,0.104,0.189,0.083,0.439,0.042,1996-97
4,1610612737,Atlanta Hawks,ATL,Hawks,Atlanta,Atlanta,1949.0,1.610613e+09,Hawks,1949.0,...,18.1,8.8,2.7,11.0,0.084,0.186,0.236,0.562,0.133,1996-97
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
12064,1610612766,Charlotte Hornets,CHA,Hornets,Charlotte,North Carolina,1988.0,1.610613e+09,Hornets,1988.0,...,20.3,5.2,1.1,-7.7,0.038,0.121,0.257,0.534,0.057,2022-23
12065,1610612766,Charlotte Hornets,CHA,Hornets,Charlotte,North Carolina,1988.0,1.610613e+09,Hornets,1988.0,...,9.0,7.1,0.4,-4.7,0.106,0.232,0.168,0.659,0.033,2022-23
12066,1610612766,Charlotte Hornets,CHA,Hornets,Charlotte,North Carolina,1988.0,1.610613e+09,Hornets,1988.0,...,23.3,6.4,8.4,-4.7,0.031,0.147,0.289,0.541,0.352,2022-23
12067,1610612766,Charlotte Hornets,CHA,Hornets,Charlotte,North Carolina,1988.0,1.610613e+09,Hornets,1988.0,...,5.6,2.1,1.2,-8.3,0.015,0.116,0.192,0.463,0.117,2022-23
