In [None]:
# Cell 1: Import Necessary Libraries
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
import seaborn as sns

# Load cleaned dataset
# The path is written as a raw string: it contains Windows backslashes followed
# by letters such as "\M", "\D", "\P" and "\A", which are invalid escape
# sequences in a normal string literal and raise a SyntaxWarning on recent
# Python versions. The raw literal has exactly the same runtime value.
# NOTE(review): this is an absolute, machine-specific location; consider a path
# relative to the notebook or a configurable data directory.
file_path = r'F:\Mytraining\DataAnalystBootcamp\Python\Data analysis with python\Axion Ray- Assesement\DATask 2.csv'
df = pd.read_csv(file_path)


In [None]:
# Cell 2: Parse REPAIR_DATE into pandas datetimes
# The column is replaced in place on `df`; later cells use its `.dt` accessor.
df['REPAIR_DATE'] = df['REPAIR_DATE'].pipe(pd.to_datetime)


In [None]:
# Cell 3: Monthly Repair Trends Extraction
# Tag every row with the monthly period its REPAIR_DATE falls in.
df['Month_Year'] = df['REPAIR_DATE'].dt.to_period('M')

# Count rows per month and flatten the result into a two-column frame
# (Month_Year, Repair_Count).
monthly_repairs = (
    df.groupby('Month_Year')
    .size()
    .reset_index(name='Repair_Count')
)

# Display Monthly Repair Trends (first rows only)
print("Monthly Repair Trends:", monthly_repairs.head(), sep="\n")


In [None]:
# Cell 4: Most Common Repair Types Extraction
# Frequency of each labor-code description, most frequent first, as a frame
# with columns (Repair_Type, Count).
repair_counts = (
    df['GLOBAL_LABOR_CODE_DESCRIPTION']
    .value_counts()
    .rename_axis('Repair_Type')
    .reset_index(name='Count')
)

# Display Top 10 Repair Types
print("\nTop 10 Most Common Repair Types:", repair_counts.head(10), sep="\n")


In [None]:
# Cell 5: Platform-Based Repairs Extraction
# Number of rows per PLATFORM value, most frequent first, as a frame with
# columns (Platform, Repair_Count).
platform_repairs = (
    df['PLATFORM']
    .value_counts()
    .rename_axis('Platform')
    .reset_index(name='Repair_Count')
)

# Display Repair Counts by Platform
print("\nRepair Counts by Platform:", platform_repairs, sep="\n")


In [None]:
# Cell 6: Repair Age Analysis
# Summary statistics of the REPAIR_AGE column, as produced by Series.describe().
repair_age_column = 'REPAIR_AGE'
repair_age_summary = df[repair_age_column].describe()

# Display Repair Age Statistics
print("\nRepair Age Summary:", repair_age_summary, sep="\n")


In [None]:
# Cell 7: Total Repair Cost Analysis
# Summary statistics of the TOTALCOST column, as produced by Series.describe().
total_cost_column = 'TOTALCOST'
total_cost_summary = df[total_cost_column].describe()

# Display Total Cost Statistics
print("\nRepair Cost Summary:", total_cost_summary, sep="\n")


In [None]:
# Cell 8: Visualization - KPI overview figure
# (monthly repair trend, top repair types, repairs by platform)
#
# All three panels are drawn in this single cell on one explicitly created
# figure, and every plotting call receives its target `ax`. Two reasons:
#   * DataFrame.plot() opens a brand-new figure unless `ax=` is passed, so the
#     monthly chart never landed in the intended subplot slot.
#   * With Jupyter's default inline backend a figure is rendered and closed when
#     its cell finishes, so panels added from later cells via plt.subplot()
#     ended up on separate figures and the saved PNG held only the last panel.
sns.set(style="whitegrid")
fig = plt.figure(figsize=(15, 10))

# Top-left panel: number of repairs per month.
ax_monthly = fig.add_subplot(2, 2, 1)
monthly_repairs.plot(
    x='Month_Year',
    y='Repair_Count',
    kind='bar',
    color='blue',
    rot=45,          # tilt the month labels so they stay readable
    ax=ax_monthly,   # draw on this figure instead of letting pandas create one
)
ax_monthly.set_title('Monthly Repair Trends')
ax_monthly.set_xlabel('Month-Year')
ax_monthly.set_ylabel('Number of Repairs')

# Top-right panel: the ten most frequent repair types (horizontal bars).
# NOTE(review): newer seaborn releases warn when `palette` is given without
# `hue`; the call is kept as-is so it also runs on older seaborn versions.
ax_types = fig.add_subplot(2, 2, 2)
sns.barplot(
    x='Count',
    y='Repair_Type',
    data=repair_counts.head(10),
    palette='Oranges_r',
    ax=ax_types,
)
ax_types.set_title('Top 10 Most Common Repair Types')
ax_types.set_xlabel('Repair Count')
ax_types.set_ylabel('Repair Type')

# Bottom panel (full width): repair counts per vehicle platform.
ax_platform = fig.add_subplot(2, 1, 2)
sns.barplot(
    x='Platform',
    y='Repair_Count',
    data=platform_repairs,
    palette='coolwarm',
    ax=ax_platform,
)
ax_platform.set_title('Repairs by Vehicle Platform')
ax_platform.set_xlabel('Platform')
ax_platform.set_ylabel('Number of Repairs')
ax_platform.tick_params(axis='x', labelrotation=45)

# Save before showing: the figure may be closed once it has been displayed.
fig.tight_layout()
fig.savefig('KPI_Analysis.png', dpi=300)
plt.show()


In [None]:
# Cell 11: Save KPI Extracted Data into CSV files
kpi_summary_file = 'KPI_Summary.csv'

# Destination file -> table to export. Written in this order, each without
# the DataFrame index column.
kpi_exports = {
    kpi_summary_file: monthly_repairs,
    'Top_Repairs.csv': repair_counts,
    'Platform_Repairs.csv': platform_repairs,
}
for csv_name, kpi_table in kpi_exports.items():
    kpi_table.to_csv(csv_name, index=False)

print(f"\nKPI Summary data saved to {kpi_summary_file}")
