In [None]:
import pandas as pd

# Location of the mammal sleep CSV in the practice-datasets repository
sleep_url = "https://raw.githubusercontent.com/bloominstituteoftechnology/data-science-practice-datasets/main/unit_1/Sleep/sleep.csv"

# Read the CSV straight from the URL into a DataFrame
Sleep = pd.read_csv(filepath_or_buffer=sleep_url)

# Preview the first five rows
print(Sleep.head(n=5))

In [None]:
import matplotlib.pyplot as plt
import seaborn as sns

# Histogram of the `Parasleep` column (labelled below as hours of dreaming
# sleep), split into 10 bins.
fig, ax = plt.subplots()
ax.hist(
    Sleep['Parasleep'],
    bins=10,
    color='skyblue',
    edgecolor='black',
)

# Label the axes and title in a single call
ax.set(
    xlabel='Total Hours of Dreaming Sleep',
    ylabel='Frequency',
    title='Daily Dreaming Sleep in Mammal Species',
)
plt.show()

In [None]:
# Boolean masks selecting the rows whose `Danger` value is 1 or 5
is_danger_1 = Sleep['Danger'] == 1
is_danger_5 = Sleep['Danger'] == 5

# Keep only the matching rows for each category
Danger_1 = Sleep[is_danger_1]
Danger_5 = Sleep[is_danger_5]

# Preview the first five rows of each subset
print(Danger_1.head(n=5))
print(Danger_5.head(n=5))

In [None]:
# Order the rows by the `Gest` column, smallest value first.
# `sort_values` returns a new DataFrame, so `Sleep` keeps its original order.
Sleep_sorted = Sleep.sort_values('Gest', ascending=True)
print(Sleep_sorted.head(n=5))

In [None]:
# Line plot of `Parasleep` against `Gest`. The rows were sorted by `Gest`
# beforehand, so the line runs left to right without doubling back.
fig, ax = plt.subplots()
ax.plot(
    Sleep_sorted['Gest'],
    Sleep_sorted['Parasleep'],
    color='b',
    linestyle='dashdot',
    marker='o',
)

# Label the axes and title in a single call
ax.set(
    xlabel='Gestational Time (days)',
    ylabel='Dreaming Sleep (hours)',
    title='Gestational Time vs. Dreaming Sleep in Mammals',
)
plt.show()

In [None]:
# Share of rows in each `Danger` category, as a fraction of all non-missing
# values (`normalize=True` makes the counts sum to 1).
Danger_prop = Sleep['Danger'].value_counts(normalize=True)

# Rescale the fractions to percentages
Danger_pct = Danger_prop.mul(100)
print(Danger_pct)

In [None]:
# Create new feature: True when `Life` is below 30, False otherwise.
# NOTE: a missing `Life` value also compares as False, so the flag alone
# cannot tell "lifespan >= 30" apart from "lifespan unknown".
Sleep['Short_life'] = Sleep['Life'] < 30

# Count plot
# - Only rows with a recorded `Life` are plotted, so unknown lifespans are not
#   counted in the ">= 30 years" bar.
# - `order` pins False to position 0 and True to position 1, so the tick labels
#   set below stay correct even if one category has no rows.
# - `palette` is paired with `hue` (same variable as x, legend hidden) because
#   seaborn >= 0.13 deprecates `palette` without `hue`; `dodge=False` keeps the
#   bars centred on their ticks on older seaborn versions.
sns.catplot(
    x='Short_life',
    data=Sleep.dropna(subset=['Life']),
    kind='count',
    order=[False, True],
    hue='Short_life',
    hue_order=[False, True],
    palette='muted',
    dodge=False,
    legend=False,
)
plt.ylabel('Frequency')
plt.xlabel('Mammal Lifespan')
plt.title('Mammal Lifespan Categories')
# Position 0 is Short_life == False (>= 30), position 1 is True (< 30)
plt.xticks(ticks=[0, 1], labels=['Lifespan >=30 years', 'Lifespan < 30 years'])
plt.show()

Results

The distribution of dreaming sleep varies widely among mammal species.

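Mammals in different danger categories (categories 1 and 5 were compared) appear to exhibit distinct sleep patterns, although this notebook only inspects the first rows of each subset rather than summary statistics.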

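Dreaming sleep tends to decrease as gestational time increases, i.e. the two appear inversely related in the line plot; no correlation coefficient was computed, so this is a visual observation.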

Most mammal species in the dataset have a lifespan shorter than 30 years.

Conclusion

This analysis provides insights into how mammalian sleep is influenced by ecological and physiological factors. Future work could explore predictive models using this dataset.