# In [2]:
import pandas as pd
import glob

# Sum the "amount" column per "package" across every "Wages*.xlsx" workbook
# in the current directory and write the result to "Package_Totals.xlsx".


def total_by_package(frame):
    """Return one row per package with the sum of its amounts.

    Args:
        frame: DataFrame with a "package" column and a numeric "amount"
            column (NaN amounts are skipped by the sum).

    Returns:
        DataFrame with columns "Package" and "Total Amount".  Rows whose
        package is missing are totalled together under a NaN package rather
        than being dropped.

    Raises:
        KeyError: if "package" or "amount" is not a column of a non-empty
            frame.
    """
    if frame.empty:
        return pd.DataFrame(columns=["Package", "Total Amount"])
    # sort=False keeps packages in order of first appearance; dropna=False
    # keeps rows with a missing package so their amounts are not lost.
    totals = frame.groupby("package", sort=False, dropna=False)["amount"].sum()
    return totals.rename_axis("Package").reset_index(name="Total Amount")


# Sorted so the order of rows in the report does not depend on the order in
# which the filesystem happens to list the workbooks.
excel_files = sorted(glob.glob("Wages*.xlsx"))

# Read each workbook, coercing non-numeric 'amount' values to NaN so that a
# stray text cell cannot break the summation.
dfs = []
for file in excel_files:
    df = pd.read_excel(file)
    df["amount"] = pd.to_numeric(df["amount"], errors="coerce")
    dfs.append(df)

if dfs:
    combined_df = pd.concat(dfs, ignore_index=True)
else:
    # pd.concat raises "No objects to concatenate" on an empty list; fall
    # back to an empty frame and tell the user why there is no output.
    combined_df = pd.DataFrame(columns=["package", "amount"])
    print("No files matching 'Wages*.xlsx' found; nothing to total.")

# Kept for any later code that relies on these names.
all_packages = combined_df["package"].unique()
final_df = total_by_package(combined_df)
package_totals = dict(zip(final_df["Package"], final_df["Total Amount"]))

# Only write a report when there was input, so a run in the wrong directory
# does not replace an earlier report with an empty one.
if dfs:
    final_df.to_excel("Package_Totals.xlsx", index=False)