In [None]:
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns
import glob

sns.set(style="whitegrid")

# Load the alphabetically-first CSV file in the working directory
# (expected to be the cardiovascular dataset).
# glob.glob() returns matches in arbitrary, filesystem-dependent order, so the
# list is sorted to make the choice reproducible across machines and re-runs.
csv_files = sorted(glob.glob('*.csv'))
if not csv_files:
    # Fail with an actionable message instead of an IndexError on csv_files[0].
    raise FileNotFoundError(
        "No CSV file found in the current working directory; "
        "place the dataset next to this notebook."
    )

# Report the chosen file so the reader knows which dataset the outputs below describe.
print(f"Loading data from: {csv_files[0]}")
df = pd.read_csv(csv_files[0])
df.head()

In [None]:
# Print a heading, then the number of null entries found in each column of df.
print("\nMissing Values Count:")
missing_per_column = df.isnull().sum()
print(missing_per_column)

In [None]:
# Histogram (with KDE overlay) of the first numerical column.
# To plot a different feature, assign its column name to `hist_col` below.
numeric_columns = df.select_dtypes(include=['int64', 'float64']).columns

if len(numeric_columns) >= 1:
    # Pick the first int64/float64 column rather than df.columns[0]: the first
    # column of the file is not guaranteed to be numeric, which would
    # contradict the plot title below.
    hist_col = numeric_columns[0]
    plt.figure(figsize=(8, 5))
    sns.histplot(df[hist_col], bins=30, kde=True, color='teal')
    plt.title('Distribution of First Numerical Feature')
    plt.xlabel(hist_col)
    plt.ylabel('Count')
    plt.show()
else:
    # Mirrors the guard used by the scatter-plot cell.
    print('No numerical columns available for histogram.')

In [None]:
# Annotated heatmap of pairwise correlations between the int64/float64 columns.
fig, ax = plt.subplots(figsize=(10, 6))

# Restrict to numerical columns before calling corr() (default method).
numeric_df = df.select_dtypes(include=['int64', 'float64'])
correlation = numeric_df.corr()

# Each cell is annotated with its coefficient, formatted to two decimals.
sns.heatmap(correlation, annot=True, fmt=".2f", cmap='coolwarm', ax=ax)
ax.set_title('Correlation Matrix of Cardiovascular Features')
plt.show()

In [None]:
# Scatter plot of the first int64/float64 column (x) against the second (y).
num_cols = df.select_dtypes(include=['int64', 'float64']).columns

if len(num_cols) < 2:
    # Two numerical columns are required for the axes; report and skip otherwise.
    print('Not enough numerical columns for scatter plot.')
else:
    x_col, y_col = num_cols[0], num_cols[1]
    plt.figure(figsize=(8, 5))
    # alpha=0.4 makes the markers semi-transparent.
    sns.scatterplot(data=df, x=x_col, y=y_col, alpha=0.4)
    plt.title(f'{x_col} vs. {y_col}')
    plt.show()

In [None]:
# Print a heading, then render the describe() summary table of df via display().
print("Summary Statistics for Numerical Columns:")
summary_stats = df.describe()
display(summary_stats)