# 🚖 Ola Data Analysis Project

This notebook explores the Ola ride-bookings dataset. It looks at the number of bookings per vehicle type, revenue by vehicle type, the cancellation rate, and the distribution of ratings.

In [None]:
# Import necessary libraries
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

# Read the bookings CSV (path is relative to the notebook's working directory).
csv_path = 'sqlnew.csv'
df = pd.read_csv(csv_path)

# info() prints the column / dtype / non-null summary; the trailing head()
# is the cell's last expression, so the first rows are rendered as its output.
df.info()
df.head()

In [None]:
# Bookings per vehicle type: count the rows for each distinct 'Vehicle Type'.
vehicle_counts = df['Vehicle Type'].value_counts()

# Label the chart through the Axes pandas returns rather than through
# pyplot's implicit "current axes".
ax = vehicle_counts.plot.bar(title='Bookings per Vehicle Type', color='skyblue')
ax.set_xlabel('Vehicle Type')
ax.set_ylabel('Number of Bookings')

plt.tight_layout()
plt.show()

In [None]:
# Revenue by vehicle type.
# Copy the trip cost into a 'Revenue' column (adds or overwrites that column on df).
df['Revenue'] = df['Cost of Trip']

# Total revenue per vehicle type, largest first.
revenue = (
    df.groupby('Vehicle Type')['Revenue']
    .sum()
    .sort_values(ascending=False)
)

ax = revenue.plot.bar(title='Revenue by Vehicle Type', color='orange')
ax.set_ylabel('Total Revenue')

plt.tight_layout()
plt.show()

In [None]:
# Cancellations pie chart: share of rows for each value of 'Cancellation'.
cancel_counts = df['Cancellation'].value_counts()

# NOTE(review): the two colours are applied in wedge order, and value_counts()
# orders by descending frequency, so which value is drawn green depends on the
# data rather than on its label — confirm this matches the intended meaning.
ax = cancel_counts.plot.pie(
    autopct='%1.1f%%',
    title='Cancellation Rate',
    colors=['green', 'red'],
)
# Blank out the y-axis label so only the title and wedge labels remain.
ax.set_ylabel('')

plt.tight_layout()
plt.show()

In [None]:
# Ratings distribution: 5-bin histogram of 'Ratings' with a KDE curve overlaid.
ax = sns.histplot(df['Ratings'], bins=5, kde=True)

# Set title and axis labels in one call on the Axes seaborn returned.
ax.set(
    title="Distribution of Ratings",
    xlabel="Ratings",
    ylabel="Frequency",
)

plt.tight_layout()
plt.show()