In [None]:
import pandas as pd

def process_data(input_file, output_file) -> None:
    """Clean a tertiary-sales CSV export and write the result as a new CSV.

    The pipeline:

    1. Reads ``input_file`` and renames ``"Calendar day"`` /
       ``"Tertiary Quantity"`` to underscore-separated names.
    2. Keeps only the six report columns, in a fixed order.
    3. Keeps only rows whose ``Remarks`` is ``"CBU"`` or ``"SKD"``.
    4. Maps a fixed set of model names to their replacement names.
    5. Snaps every ``Calendar_Day`` to the first day of its month.
    6. Removes every remaining literal ``"_MF"`` from ``Actual_Model_Name``.
    7. Writes the frame to ``output_file`` without the index.

    Args:
        input_file: Path or file-like object accepted by ``pandas.read_csv``.
        output_file: Path or file-like object accepted by
            ``DataFrame.to_csv``.

    Raises:
        KeyError: If one of the required columns is absent from the input.
    """
    report_columns = [
        "Calendar_Day",
        "Actual_Model_Name",
        "Category",
        "Business",
        "Remarks",
        "Tertiary_Quantity",
    ]

    # Whole-value replacements applied to 'Actual_Model_Name'.
    name_change = {
        "LAVA_A1Colors_MF": "LAVA_A1",
        "LAVA PULSE_MF": "A7_BT_PULSE",
        "LAVA_A7_2020_MF": "LF7000_A7",
        "LAVA_A1WAVE_MF": "LAVA_A1",
        "LAVA_A7WAVE_MF": "LAVA_A7",
        "LAVA_A9WAVE_MF": "LAVA_A9",
        "LF5000_A5WAVE_MF": "LF5000_A5",
        "A1_JOSH2021_MF": "A1_JOSH2021",
        "A1_JOSH2021_New_MF": "A1_JOSH2021",
        "LF1000_A1_2021_MF": "LF1000_A1_2021",
        "LF1000_A1_2021_New_MF": "LF1000_A1_2021",
        "A1_TAMIL_VIBE": "LF1008_A1_VIBE",
    }

    df = pd.read_csv(input_file).rename(
        columns={
            "Calendar day": "Calendar_Day",
            "Tertiary Quantity": "Tertiary_Quantity",
        }
    )
    df = df[report_columns]

    # reset_index returns a fresh frame, so the column assignments below do
    # not write into a slice of the frame that was read from disk.
    df = df[df["Remarks"].isin(["CBU", "SKD"])].reset_index(drop=True)

    # The explicit mapping must run before the generic "_MF" strip, because
    # its keys still carry the suffix.
    df["Actual_Model_Name"] = df["Actual_Model_Name"].replace(name_change)

    # Round-tripping through a monthly Period yields the month's first day
    # directly; missing dates stay NaT.
    parsed_days = pd.to_datetime(df["Calendar_Day"])
    df["Calendar_Day"] = parsed_days.dt.to_period("M").dt.to_timestamp()

    # regex=False: "_MF" is a literal, and the default for `regex` differs
    # between pandas versions.
    df["Actual_Model_Name"] = df["Actual_Model_Name"].str.replace(
        "_MF", "", regex=False
    )

    df.to_csv(output_file, index=False)

# Run the pipeline: read the raw tertiary export and write the cleaned report input.
process_data(
    input_file='tertiaryData.csv',
    output_file='tertiaryData_for_KumarReport.csv',
)