In [1]:
import pandas as pd

def extract_and_save_formwork_data(file_path1, file_path2, output_file_path,
                                   package="0301 - Formwork"):
    """
    Extract the rows of one package from two Excel files into a new Excel file.

    Both workbooks are read, the rows whose 'package' column equals
    ``package`` are kept, the two results are concatenated (first file's rows
    first, with a fresh index) and written to ``output_file_path`` without
    the index column.

    If either input file does not exist, an error line is printed for every
    missing path and the function returns without writing anything.

    Args:
      file_path1: Path to the first Excel file.
      file_path2: Path to the second Excel file.
      output_file_path: Path to save the extracted data.
      package: Value of the 'package' column to keep. Defaults to
        "0301 - Formwork".

    Returns:
      None.

    Raises:
      KeyError: If one of the workbooks has no 'package' column.
    """
    loaded = []
    missing = []
    for path in (file_path1, file_path2):
        try:
            loaded.append((path, pd.read_excel(path)))
        except FileNotFoundError:
            # Keep going so that every missing path is reported in one run.
            missing.append(path)

    if missing:
        for path in missing:
            print(f"Error: File not found: {path}")
        return

    filtered_frames = []
    for path, df in loaded:
        # Fail with the offending file named instead of a bare KeyError.
        if 'package' not in df.columns:
            raise KeyError(f"Column 'package' not found in {path}")
        filtered_frames.append(df[df['package'] == package])

    # Concatenate the filtered DataFrames and renumber the rows from 0
    combined_df = pd.concat(filtered_frames, ignore_index=True)

    # Save the combined DataFrame to a new Excel file
    combined_df.to_excel(output_file_path, index=False)
    print(f"Extracted data saved to: {output_file_path}")


# Directory that contains both input workbooks and receives the output file.
# Defined once so a change of location is a single edit.
DATA_DIR = "D:/OneDrive/OneDrive - Rowad Modern Engineering/x004 Data Science/03.rme.db/01.tables/02.manual/02.wages/00.all/04.xlsx.dated"

# File paths
file_path1 = f"{DATA_DIR}/All_Wages_Part1.xlsx"
file_path2 = f"{DATA_DIR}/All_Wages_Part2.xlsx"
output_file_path = f"{DATA_DIR}/formwork_data.xlsx"

# Extract and save the data
extract_and_save_formwork_data(file_path1, file_path2, output_file_path)

Extracted data saved to: D:/OneDrive/OneDrive - Rowad Modern Engineering/x004 Data Science/03.rme.db/01.tables/02.manual/02.wages/00.all/04.xlsx.dated/formwork_data.xlsx
