# Combining All Teams into a Single DataFrame

## Importing Libraries

In [1]:
import pandas as pd
import os

## Defining Directory and File Names

In [2]:
# Relative path of the folder that holds the raw per-league team CSV files.
data_dir = "../../data/teams/raw"

# Maps each raw CSV file name to the readable league name that is written
# into the "League" column for every row read from that file.
league_labels = {
    "premier_league_teams.csv": "Premier League",
    "serie_a_teams.csv": "Serie A",
    "la_liga_teams.csv": "La Liga",
    "bundesliga_teams.csv": "Bundesliga",
    "ligue_1_teams.csv": "Ligue 1",
}

# Files to process. Derived from the mapping (single source of truth) so a
# file can never be listed without a label; dicts keep insertion order, so
# the processing order is the order written above.
files = list(league_labels)

# Accumulator for the per-league DataFrames; filled by the file-reading loop.
combined = []

## Reading and Processing Each File

In [3]:
# Start from an empty list on every run so that re-executing this cell does
# not append the same leagues to `combined` a second time.
combined = []

for file in files:
    path = os.path.join(data_dir, file)

    # Skip (with a warning) anything that is not an existing regular file;
    # a directory with the same name would otherwise fail inside read_csv.
    if not os.path.isfile(path):
        print(f"⚠️ File not found: {file}")
        continue

    # Keep only the club name, expose it as "Team Name", tag every row with
    # the league label for this file, and put "League" first.
    df = (
        pd.read_csv(path)[["Club Name"]]
        .rename(columns={"Club Name": "Team Name"})
        .assign(League=league_labels[file])
        .loc[:, ["League", "Team Name"]]
    )
    combined.append(df)

## Combining All Files into a Single DataFrame

In [None]:
# Destination of the merged table. Defined once so the file that is written
# and the path shown in the confirmation message cannot drift apart.
output_path = "../../data/teams/cleaned/all_league_teams.csv"

if combined:
    # Stack the per-league frames and renumber the rows 0..n-1.
    final_df = pd.concat(combined, ignore_index=True)
    # to_csv does not create missing folders, so make sure the target exists.
    os.makedirs(os.path.dirname(output_path), exist_ok=True)
    final_df.to_csv(output_path, index=False)
    print(f"✅ Saved to '{output_path}'")
else:
    # Nothing was loaded (every input file was missing): write no file.
    print("❌ No team data found to merge.")

✅ Saved to '../../data/teams/cleaned/all_league_teams.csv'
