In [None]:
# # Cell 1: Load Iris Dataset
import pandas as pd

# Column names are passed explicitly through `names=`, so the file's rows are
# all read as data (assumes the CSV has no header row of its own -- TODO confirm).
iris_columns = ['sepal_length', 'sepal_width', 'petal_length', 'petal_width', 'class']
iris = pd.read_csv('/content/iris.csv', names=iris_columns)

# Last expression of the cell: preview the final rows of the frame.
iris.tail()

In [None]:
# # Cell 2: Iris Dataset Summary
# Render pandas' descriptive statistics for the `iris` frame loaded in Cell 1.
# Being the last expression in the cell, the result is shown as the cell output.
iris.describe()

In [None]:
# # Cell 3: Scatter Plot - Petal Length vs Petal Width
import matplotlib.pyplot as plt

# The two petal measurements that are plotted against each other.
x = iris['petal_length']
y = iris['petal_width']

# Draw on an explicitly created Axes rather than pyplot's implicit current one.
fig, ax = plt.subplots()
ax.scatter(x, y)
ax.set_title("Scatter Plot: Petal Length vs Petal Width")
ax.set_xlabel("Petal Length")
ax.set_ylabel("Petal Width")
ax.grid(True)
plt.show()

In [None]:
# # Cell 4: Scatter Plot - Sepal Length vs Sepal Width
fig, ax = plt.subplots()

# Sepal length on the x-axis, sepal width on the y-axis, one point per row.
ax.scatter(iris['sepal_length'], iris['sepal_width'])

# Title and axis labels are applied in a single call on the Axes.
ax.set(
    title='Iris Dataset: Sepal Dimensions',
    xlabel='Sepal Length',
    ylabel='Sepal Width',
)
ax.grid(True)
plt.show()

In [None]:
# # Cell 5: Color-coded Scatter Plot by Species
# Color assigned to each value of the 'class' column.
colors = {'Iris-setosa': 'r', 'Iris-versicolor': 'g', 'Iris-virginica': 'b'}

# Fail loudly if the data contains a class with no assigned color, instead of
# handing matplotlib an unmapped (NaN) color value.
unmapped = set(iris['class'].unique()) - set(colors)
if unmapped:
    raise ValueError(f"No color defined for class value(s): {sorted(map(str, unmapped))}")

fig, ax = plt.subplots()

# One scatter call per species so each group carries its own legend entry;
# without a legend the color coding cannot be read from the figure.
for species_name, species_color in colors.items():
    subset = iris[iris['class'] == species_name]
    ax.scatter(
        subset['sepal_length'],
        subset['sepal_width'],
        color=species_color,
        label=species_name,
    )

ax.set_title("Scatter Plot: Sepal Length vs Width by Species")
ax.set_xlabel('Sepal Length')
ax.set_ylabel('Sepal Width')
ax.legend(title='Species')
ax.grid(True)
plt.show()

In [None]:
# # Cell 6: Flower Count by Species
# Number of rows per distinct value of the 'class' column.
species_counts = iris['class'].value_counts()

# One bar per species: index values give the bar names, counts give the heights.
fig, ax = plt.subplots()
ax.bar(species_counts.index, species_counts.values, color='lightblue')
ax.set(title="Number of Flowers by Species", xlabel="Species", ylabel="Count")
ax.grid(axis='y')  # horizontal grid lines only
plt.show()

In [None]:
# # Cell 7: Distribution of Petal Length
fig, ax = plt.subplots()

# Histogram of petal length over 10 bins; black edges separate adjacent bars.
ax.hist(iris['petal_length'], bins=10, color='lightgreen', edgecolor='black')
ax.set(
    title="Distribution of Petal Length",
    xlabel="Petal Length (cm)",
    ylabel="Frequency",
)
ax.grid(True)
plt.show()

In [None]:
# # Cell 8: Box Plot - Petal Length by Species
# Distinct species, and the petal-length values belonging to each of them.
species = iris['class'].unique()
data = [iris.loc[iris['class'] == s, 'petal_length'] for s in species]

# Name the boxes through the x-axis ticks rather than boxplot's `labels=`
# keyword, which Matplotlib 3.9 deprecated (renamed to `tick_labels`).
# boxplot places the boxes at positions 1..N by default, so the ticks go there.
plt.boxplot(data)
plt.xticks(range(1, len(species) + 1), species)
plt.title("Petal Length by Species")
plt.xlabel("Species")
plt.ylabel("Petal Length (cm)")
plt.grid(True)
plt.show()

In [None]:
# # Cell 9: Petal Length vs Width Relationship
fig, ax = plt.subplots()

# Semi-transparent markers (alpha=0.6) keep overlapping points distinguishable.
ax.scatter(iris['petal_length'], iris['petal_width'], color='purple', alpha=0.6)
ax.set(
    title="Petal Length vs Petal Width",
    xlabel="Petal Length (cm)",
    ylabel="Petal Width (cm)",
)
ax.grid(True)
plt.show()

In [None]:
# # Cell 10: Load mtcars Dataset
# Read the mtcars CSV into `df`; later cells read its 'wt', 'mpg', 'am',
# 'cyl' and 'gear' columns.
df = pd.read_csv('/content/mtcars.csv')
# Last expression of the cell: preview the first rows of the frame.
df.head()

In [None]:
# # Cell 11: Scatter Plot - Car Weight vs MPG
fig, ax = plt.subplots()

# 'wt' on the x-axis against 'mpg' on the y-axis, one point per row of df.
ax.scatter(df['wt'], df['mpg'])
ax.set(
    title='Scatter Plot: Car Weight vs MPG',
    xlabel='Weight (1000 lbs)',
    ylabel='Miles per Gallon',
)
ax.grid(True)
plt.show()

In [None]:
# # Cell 12: Bar Plot - Transmission Types
# Rows with am == 0 are counted as automatic, rows with am == 1 as manual.
auto_count = df['am'].eq(0).sum()
manual_count = df['am'].eq(1).sum()

# Bar names and heights, kept in matching order.
labels = ['Automatic', 'Manual']
counts = [auto_count, manual_count]

fig, ax = plt.subplots()
ax.bar(labels, counts, color=['orange', 'blue'])
ax.set_title("Transmission Type Frequency")
ax.set_xlabel("Transmission Type")
ax.set_ylabel("Count")
ax.grid(axis='y')  # horizontal grid lines only
plt.show()

In [None]:
# # Cell 13: Histogram of MPG
fig, ax = plt.subplots()

# Histogram of the 'mpg' column over 8 bins.
ax.hist(df['mpg'], bins=8, color='skyblue', edgecolor='black')
ax.set(
    title="Distribution of MPG",
    xlabel="Miles per Gallon",
    ylabel="Frequency",
)
ax.grid(True)
plt.show()

In [None]:
# # Cell 14: Box Plot - MPG
fig, ax = plt.subplots()

# A single box summarising the whole 'mpg' column.
ax.boxplot(df['mpg'])
ax.set(title="Box Plot of MPG", ylabel="Miles per Gallon")
ax.grid(True)
plt.show()

In [None]:
# # Cell 15: MPG by Cylinders
# Distinct cylinder counts in ascending order, and the mpg values for each.
cylinders = sorted(df['cyl'].unique())
data = [df.loc[df['cyl'] == c, 'mpg'] for c in cylinders]

# Name the boxes through the x-axis ticks rather than boxplot's `labels=`
# keyword, which Matplotlib 3.9 deprecated (renamed to `tick_labels`).
# boxplot places the boxes at positions 1..N by default, so the ticks go there.
plt.boxplot(data)
plt.xticks(range(1, len(cylinders) + 1), [str(c) for c in cylinders])
plt.title("MPG by Number of Cylinders")
plt.xlabel("Cylinders")
plt.ylabel("MPG")
plt.grid(True)
plt.show()

In [None]:
# # Cell 16: Cars by Gear Count
# Rows per 'gear' value, ordered by the gear value rather than by frequency.
gear_counts = df['gear'].value_counts().sort_index()

# The index is converted to strings so the bars are drawn as categories.
fig, ax = plt.subplots()
ax.bar(gear_counts.index.astype(str), gear_counts.values, color='lightgreen')
ax.set(title="Number of Cars by Gear", xlabel="Gear", ylabel="Count")
ax.grid(axis='y')  # horizontal grid lines only
plt.show()

In [None]:
# # Cell 17: Cars by Cylinder Count
# Rows per 'cyl' value, ordered by the cylinder value rather than by frequency.
cyl_counts = df['cyl'].value_counts().sort_index()

# The index is converted to strings so the bars are drawn as categories.
fig, ax = plt.subplots()
ax.bar(cyl_counts.index.astype(str), cyl_counts.values, color='skyblue')
ax.set(
    title="Number of Cars by Cylinder Count",
    xlabel="Cylinders",
    ylabel="Number of Cars",
)
ax.grid(axis='y')  # horizontal grid lines only
plt.show()

In [None]:
# # Cell 18: Load Student Performance Dataset
# Read the student performance CSV into `sp`; later cells read its 'gender',
# 'math score', 'reading score', 'writing score' and 'test preparation course' columns.
sp = pd.read_csv('/content/StudentsPerformance.csv')
# Last expression of the cell: preview the first rows of the frame.
sp.head()

In [None]:
# # Cell 19: Gender Distribution
# Number of students per distinct value of the 'gender' column.
gender_counts = sp['gender'].value_counts()

# Bars follow the order returned by value_counts(); the colors in the list are
# applied in that same order, not tied to a particular gender value.
fig, ax = plt.subplots()
ax.bar(gender_counts.index, gender_counts.values, color=['blue', 'pink'])
ax.set(title="Student Count by Gender", xlabel="Gender", ylabel="Count")
ax.grid(axis='y')  # horizontal grid lines only
plt.show()

In [None]:
# # Cell 20: Math Score Distribution
fig, ax = plt.subplots()

# Histogram of the 'math score' column over 10 bins.
ax.hist(sp['math score'], bins=10, color='lightblue', edgecolor='black')
ax.set(
    title="Math Score Distribution",
    xlabel="Math Score",
    ylabel="Number of Students",
)
ax.grid(True)
plt.show()

In [None]:
# # Cell 21: Math Scores by Gender (Box Plot)
# Distinct gender values, and the math scores belonging to each of them.
genders = sp['gender'].unique()
data = [sp.loc[sp['gender'] == g, 'math score'] for g in genders]

# Name the boxes through the x-axis ticks rather than boxplot's `labels=`
# keyword, which Matplotlib 3.9 deprecated (renamed to `tick_labels`).
# boxplot places the boxes at positions 1..N by default, so the ticks go there.
plt.boxplot(data)
plt.xticks(range(1, len(genders) + 1), genders)
plt.title("Math Score by Gender")
plt.xlabel("Gender")
plt.ylabel("Math Score")
plt.grid(True)
plt.show()

In [None]:
# # Cell 22: Test Preparation Course Completion
# Number of students per distinct value of 'test preparation course'.
prep_counts = sp['test preparation course'].value_counts()

# Bars follow the order returned by value_counts(); the colors in the list are
# applied in that same order, not tied to a particular course status.
fig, ax = plt.subplots()
ax.bar(prep_counts.index, prep_counts.values, color=['green', 'orange'])
ax.set(
    title="Test Preparation Course Completion",
    xlabel="Course Status",
    ylabel="Count",
)
ax.grid(axis='y')  # horizontal grid lines only
plt.show()

In [None]:
# # Cell 23: Reading vs Writing Score
fig, ax = plt.subplots()

# Semi-transparent markers (alpha=0.5) keep overlapping points distinguishable.
ax.scatter(sp['reading score'], sp['writing score'], color='purple', alpha=0.5)
ax.set(
    title="Reading vs Writing Score",
    xlabel="Reading Score",
    ylabel="Writing Score",
)
ax.grid(True)
plt.show()

In [None]:
# # Cell 24: Seaborn Box Plot Comparison
import seaborn as sns
import numpy as np

# Draw from a seeded generator so the samples, and therefore the figure, are
# identical on every Restart & Run All.
rng = np.random.default_rng(42)

# Two synthetic samples of 1000 normal draws each: mean 0 and mean 2, both std 1.
data1 = rng.normal(0, 1, 1000)
data2 = rng.normal(2, 1, 1000)

# One box per sample, in list order.
sns.boxplot(data=[data1, data2])
plt.xlabel("Distribution")
plt.ylabel("Value")
plt.title("Box Plot Comparison of Two Distributions")
plt.grid(True)
plt.show()