# Udemy Data Analysis - Jupyter Notebook

In [None]:
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

# Read the course CSV (path is relative to the working directory) into a DataFrame.
df = pd.read_csv(filepath_or_buffer="udemy_courses.csv")

# Preview the first five rows; as the cell's last expression it is the cell output.
df.head(n=5)


## Basic Statistics and Info

In [None]:
# Print the structural overview (columns, dtypes, non-null counts).
df.info()

# Build the summary-statistics table with pandas' default settings and
# leave it as the last expression so it is shown as the cell output.
summary_stats = df.describe()
summary_stats


## Top Rated Courses

In [None]:
# Order every course from the highest rating down to the lowest.
top_rated = df.sort_values("Rating", ascending=False)

# Show only the identifying columns for the first five rows of that ranking.
display_columns = ['Title', 'Instructor', 'Rating']
top_rated.loc[:, display_columns].head()


## Course Ratings Distribution

In [None]:
# Histogram of the Rating column (5 bins) with a KDE curve overlaid,
# drawn on an explicitly created 8x5 inch figure.
hist_fig, hist_ax = plt.subplots(figsize=(8, 5))
sns.histplot(df['Rating'], bins=5, kde=True, ax=hist_ax)

# Title, axis labels and grid lines.
hist_ax.set_title("Distribution of Course Ratings")
hist_ax.set_xlabel("Rating")
hist_ax.set_ylabel("Frequency")
hist_ax.grid(True)

plt.show()


## Correlation Heatmap

In [None]:
# Pairwise correlations between the numeric columns only.
corr_matrix = df.corr(numeric_only=True)

# Draw the matrix as an annotated heatmap on an 8x5 inch figure.
heat_fig, heat_ax = plt.subplots(figsize=(8, 5))
sns.heatmap(corr_matrix, annot=True, cmap="YlGnBu", ax=heat_ax)
heat_ax.set_title("Correlation Heatmap")

plt.show()


## Instructor-wise Average Rating

In [None]:
# Mean rating per instructor, ordered from highest to lowest.
instructor_avg = (
    df.groupby('Instructor')['Rating']
    .mean()
    .sort_values(ascending=False)
)

# One bar per instructor; the plot call returns the Axes it drew on,
# which is then used for the y-label and horizontal grid lines.
bar_ax = instructor_avg.plot.bar(figsize=(8, 5), title='Average Rating per Instructor')
bar_ax.set_ylabel("Average Rating")
bar_ax.grid(axis='y')

plt.show()
