In [1]:
import seaborn as sns
import matplotlib.pyplot as plt

In [None]:
# List the names of the example datasets that seaborn can load
sns.get_dataset_names()

In [None]:
# Load seaborn's "tips" example dataset; later plotting cells reuse this frame
tips = sns.load_dataset('tips')

In [None]:
# Show the tips frame as this cell's output
tips

In [None]:
# Fetch the iris example dataset and preview its first five rows
iris = sns.load_dataset("iris")
iris.head(n=5)


In [None]:
# Distinct values of the 'species' column (used as hue/style in the relplot cell)
iris['species'].unique()

In [None]:
# Figure-level scatter of sepal length vs. width; species drives both colour
# and marker, petal length drives marker size.
sns.relplot(
    data=iris,
    x="sepal_length",
    y="sepal_width",
    hue="species",
    style="species",
    size="petal_length",
)
plt.title("Scatter Plot with relplot")
plt.show()

In [None]:
# Axes-level scatter of tip against total bill; meal time sets colour and
# marker, party size sets marker size.
tips_scatter_ax = sns.scatterplot(
    data=tips,
    x="total_bill",
    y="tip",
    hue="time",
    style="time",
    size="size",
)
tips_scatter_ax.set_title("Scatter Plot with scatterplot")
plt.show()

In [None]:
# Fetch the fmri example dataset and preview its first 15 rows
fmri = sns.load_dataset("fmri")
fmri.head(n=15)

In [None]:
# Distinct values of 'region' (mapped to hue in the line plot cell)
fmri['region'].unique()

In [None]:
# Distinct values of 'event' (mapped to line style in the line plot cell)
fmri['event'].unique()

In [None]:
# Distinct values of 'timepoint' (the x variable in the line plot cell)
fmri['timepoint'].unique()

In [None]:
# Signal over timepoint with lineplot: colour per region, marker per event,
# solid lines only (dashes=False) and no error band (errorbar=None).
sns.lineplot(
    data=fmri,
    x="timepoint",
    y="signal",
    hue="region",
    style="event",
    markers=True,
    dashes=False,
    errorbar=None,
).set_title("Line Plot with lineplot")
plt.show()

In [None]:
# Preview the first rows of tips
tips.head()

In [None]:
# Wide 15x6 canvas for the tip-by-party-size line plot
plt.figure(figsize=(15, 6))
# lineplot draws on the current axes: one line per meal time, markers on,
# solid lines only, no error band.
sns.lineplot(
    data=tips,
    x="size",
    y="tip",
    hue="time",
    style="time",
    markers=True,
    dashes=False,
    errorbar=None,
).set_title("Line Plot with lineplot")
plt.show()

In [None]:
# Fetch the titanic example dataset and preview its first five rows
titanic = sns.load_dataset("titanic")
titanic.head(n=5)


In [None]:
# Figure-level histogram (kind='hist') of passenger age in 30 bins, with the
# bars for each sex stacked on top of one another.
sns.displot(
    data=titanic,
    x="age",
    hue="sex",
    kind='hist',
    multiple="stack",
    bins=30,
    palette="magma",
)
plt.title("Displot with kind='hist'")
plt.xlabel("Age")
plt.ylabel("Count")
plt.show()

In [None]:
# Figure-level kernel density estimate (kind='kde') of passenger age, with the
# per-sex curves stacked.
sns.displot(titanic, x="age", hue="sex", multiple="stack", palette="viridis", kind='kde')
plt.title("Displot with kind='kde'")
plt.xlabel("Age")
# A KDE's y-axis is an estimated density, not a count of observations.
plt.ylabel("Density")
plt.show()

In [None]:
# Axes-level stacked histogram of age by sex (30 bins) with a KDE curve
# overlaid via kde=True.
sns.histplot(
    data=titanic,
    x="age",
    hue="sex",
    multiple="stack",
    bins=30,
    kde=True,
    palette="viridis",
).set_title('Histogram with histplot')
plt.show()

In [None]:
# KDE plot: filled kernel density estimate of passenger age, one curve per sex
sns.kdeplot(data=titanic, x="age", hue="sex", palette="viridis", fill=True)
plt.title('KDE plot with kdeplot')
# Explicit axis labels, matching the other distribution cells in this notebook
plt.xlabel("Age")
plt.ylabel("Density")
plt.show()

In [None]:
# Fetch the diamonds example dataset and preview its first five rows
diamonds = sns.load_dataset("diamonds")
diamonds.head(n=5)

In [None]:
# Empirical cumulative distribution of price, one curve per cut
sns.ecdfplot(
    data=diamonds,
    x="price",
    hue="cut",
).set_title('ECDF plot with ecdfplot')
plt.show()

In [None]:
# Fetch the penguins example dataset
penguins = sns.load_dataset("penguins")
# Rug plot of flipper length, ticks coloured by species
penguins_rug_ax = sns.rugplot(
    data=penguins,
    x="flipper_length_mm",
    hue="species",
    height=0.1,
)
penguins_rug_ax.set_ylim(0, 0.1)
penguins_rug_ax.set_title('Rug Plot with rugplot')
plt.show()

In [None]:
import pandas as pd

In [None]:
# Read the adult dataset from a CSV in the working directory and preview it.
# NOTE(review): this needs a local 'adult.csv', and `adult` is not referenced by
# the later cells visible here (they use `data`) — confirm this cell is still needed.
adult = pd.read_csv('adult.csv')
adult.head(n=5)

In [None]:
# Source file has no header row, so the column names are supplied here
url = "https://archive.ics.uci.edu/ml/machine-learning-databases/adult/adult.data"
column_names = [
    "age",
    "workclass",
    "fnlwgt",
    "education",
    "education_num",
    "marital_status",
    "occupation",
    "relationship",
    "race",
    "sex",
    "capital_gain",
    "capital_loss",
    "hours_per_week",
    "native_country",
    "income",
]

# '?' entries are read as missing values; skipinitialspace=True skips the
# spaces that follow each delimiter.
data = pd.read_csv(
    url,
    names=column_names,
    header=None,
    skipinitialspace=True,
    na_values='?',
)

# Preview the first five rows
data.head(n=5)


In [None]:

# Summary statistics of the dataset via DataFrame.describe()
data.describe()

In [None]:
# Figure-level scatter (relplot, kind='scatter') of weekly hours against age,
# coloured by income; alpha=0.7 makes the markers semi-transparent.
sns.relplot(
    data=data,
    kind='scatter',
    x='age',
    y='hours_per_week',
    hue='income',
    alpha=0.7,
    height=6,
    aspect=1.5,
)
plt.title('Scatter Plot of Age vs. Hours Worked per Week')
plt.xlabel('Age')
plt.ylabel('Hours per Week')
plt.show()

In [None]:
# Mean weekly hours for each (age, income) pair, with the group keys turned
# back into ordinary columns for plotting.
avg_hours_per_age_income = (
    data
    .groupby(['age', 'income'])['hours_per_week']
    .mean()
    .reset_index()
)

# Line plot through relplot (kind='line'): one marked line per income group
sns.relplot(
    data=avg_hours_per_age_income,
    kind='line',
    x='age',
    y='hours_per_week',
    hue='income',
    marker='o',
    height=6,
    aspect=1.5,
)
plt.title('Line Plot of Average Hours Worked per Week by Age')
plt.xlabel('Age')
plt.ylabel('Average Hours per Week')
plt.show()

In [None]:
# Axes-level scatter of capital loss against capital gain, coloured by income
capital_ax = sns.scatterplot(
    data=data,
    x='capital_gain',
    y='capital_loss',
    hue='income',
    palette='viridis',
    alpha=0.7,
)
capital_ax.set_title('Scatter Plot of Capital Gain vs. Capital Loss')
capital_ax.set_xlabel('Capital Gain')
capital_ax.set_ylabel('Capital Loss')
# Rebuild the legend with a capitalised title
capital_ax.legend(title='Income')
plt.show()

In [None]:
# Mean weekly hours for each (age, sex) pair, with the group keys turned back
# into ordinary columns for plotting.
avg_hours_per_age_sex = (
    data
    .groupby(['age', 'sex'])['hours_per_week']
    .mean()
    .reset_index()
)

# Axes-level line plot: one marked line per sex
hours_by_sex_ax = sns.lineplot(
    data=avg_hours_per_age_sex,
    x='age',
    y='hours_per_week',
    hue='sex',
    marker='o',
)
hours_by_sex_ax.set_title('Line Plot of Average Hours Worked per Week by Age and Sex')
hours_by_sex_ax.set_xlabel('Age')
hours_by_sex_ax.set_ylabel('Average Hours per Week')
plt.show()

In [None]:
# Figure-level histogram of age (displot) with 30 bins, drawn in green
sns.displot(
    data=data,
    x='age',
    bins=30,
    color='green',
    height=6,
    aspect=1.5,
)
plt.title('Histogram of Ages')
plt.xlabel('Age')
plt.ylabel('Frequency')
plt.show()